diff --git "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" --- "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" +++ "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.2602, "train/learning_rate": 1.8408450704225354e-06, "train/epoch": 23.54, "train/global_step": 21000, "_runtime": 127314, "_timestamp": 1648268658, "_step": 21013, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 5.0, 1.0, 5.0, 5.0, 9.0, 13.0, 17.0, 12.0, 19.0, 16.0, 34.0, 28.0, 25.0, 30.0, 37.0, 37.0, 35.0, 45.0, 46.0, 45.0, 44.0, 40.0, 41.0, 41.0, 33.0, 42.0, 30.0, 31.0, 28.0, 24.0, 31.0, 24.0, 17.0, 18.0, 18.0, 11.0, 14.0, 8.0, 7.0, 8.0, 6.0, 7.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-44.89548873901367, -43.69374465942383, -42.49199676513672, -41.290252685546875, -40.088504791259766, -38.88676071166992, -37.68501281738281, -36.48326873779297, -35.281524658203125, -34.07978057861328, -32.87803268432617, -31.676286697387695, -30.47454071044922, -29.272796630859375, -28.0710506439209, -26.869304656982422, -25.667556762695312, -24.465810775756836, -23.26406478881836, -22.062318801879883, -20.860572814941406, -19.658828735351562, -18.457082748413086, -17.25533676147461, -16.053590774536133, -14.851844787597656, -13.65009880065918, -12.44835376739502, -11.246607780456543, -10.044861793518066, -8.843116760253906, -7.64137077331543, -6.439628601074219, -5.237882614135742, -4.036137104034424, -2.8343913555145264, -1.632645606994629, -0.43089962005615234, 0.770845890045166, 1.9725914001464844, 3.174337387084961, 4.3760833740234375, 5.577828884124756, 6.779574394226074, 7.981320381164551, 9.183066368103027, 10.384811401367188, 11.586557388305664, 12.78830337524414, 13.990049362182617, 15.191795349121094, 16.39354133605957, 17.595287322998047, 18.79703140258789, 19.998777389526367, 21.200523376464844, 22.40226936340332, 23.604015350341797, 24.805761337280273, 26.00750732421875, 27.209251403808594, 28.410999298095703, 29.612743377685547, 30.814489364624023, 32.0162353515625]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 8.0, 5.0, 15.0, 17.0, 14.0, 10.0, 19.0, 19.0, 20.0, 35.0, 34.0, 33.0, 28.0, 31.0, 43.0, 28.0, 41.0, 33.0, 37.0, 45.0, 37.0, 40.0, 39.0, 43.0, 32.0, 43.0, 33.0, 32.0, 36.0, 29.0, 20.0, 15.0, 14.0, 9.0, 8.0, 14.0, 8.0, 4.0, 8.0, 2.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.66038131713867, -35.51462173461914, -34.36886215209961, -33.22310256958008, -32.07734298706055, -30.931583404541016, -29.78582191467285, -28.64006233215332, -27.49430274963379, -26.348543167114258, -25.202783584594727, -24.057024002075195, -22.91126251220703, -21.7655029296875, -20.61974334716797, -19.473983764648438, -18.328224182128906, -17.182464599609375, -16.036705017089844, -14.890944480895996, -13.745184898376465, -12.599425315856934, -11.453664779663086, -10.307905197143555, -9.162145614624023, -8.016386032104492, -6.870625972747803, -5.724865913391113, -4.579106330871582, -3.433346748352051, -2.2875866889953613, -1.1418266296386719, 0.003932952880859375, 1.1496927738189697, 2.29545259475708, 3.4412124156951904, 4.586972236633301, 5.732731819152832, 6.8784918785095215, 8.024251937866211, 9.170011520385742, 10.315771102905273, 11.461530685424805, 12.607291221618652, 13.753050804138184, 14.898810386657715, 16.044570922851562, 17.190330505371094, 18.336090087890625, 19.481849670410156, 20.627609252929688, 21.77336883544922, 22.91912841796875, 24.06488800048828, 25.210649490356445, 26.356409072875977, 27.502168655395508, 28.64792823791504, 29.79368782043457, 30.9394474029541, 32.085208892822266, 33.2309684753418, 34.37672805786133, 35.52248764038086, 36.66824722290039]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 20.0, 25.0, 54.0, 70.0, 111.0, 183.0, 306.0, 535.0, 881.0, 1461.0, 2393.0, 4077.0, 6590.0, 11257.0, 18929.0, 31295.0, 52555.0, 87366.0, 146278.0, 241882.0, 390815.0, 590865.0, 731247.0, 663770.0, 468594.0, 294610.0, 179111.0, 107093.0, 65001.0, 38540.0, 23214.0, 14009.0, 8512.0, 4935.0, 2941.0, 1865.0, 1120.0, 699.0, 433.0, 248.0, 143.0, 90.0, 53.0, 44.0, 22.0, 8.0, 13.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-52.0, -50.24951171875, -48.4990234375, -46.74853515625, -44.998046875, -43.24755859375, -41.4970703125, -39.74658203125, -37.99609375, -36.24560546875, -34.4951171875, -32.74462890625, -30.994140625, -29.24365234375, -27.4931640625, -25.74267578125, -23.9921875, -22.24169921875, -20.4912109375, -18.74072265625, -16.990234375, -15.23974609375, -13.4892578125, -11.73876953125, -9.98828125, -8.23779296875, -6.4873046875, -4.73681640625, -2.986328125, -1.23583984375, 0.5146484375, 2.26513671875, 4.015625, 5.76611328125, 7.5166015625, 9.26708984375, 11.017578125, 12.76806640625, 14.5185546875, 16.26904296875, 18.01953125, 19.77001953125, 21.5205078125, 23.27099609375, 25.021484375, 26.77197265625, 28.5224609375, 30.27294921875, 32.0234375, 33.77392578125, 35.5244140625, 37.27490234375, 39.025390625, 40.77587890625, 42.5263671875, 44.27685546875, 46.02734375, 47.77783203125, 49.5283203125, 51.27880859375, 53.029296875, 54.77978515625, 56.5302734375, 58.28076171875, 60.03125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 7.0, 15.0, 19.0, 13.0, 12.0, 15.0, 15.0, 24.0, 11.0, 19.0, 15.0, 31.0, 35.0, 25.0, 29.0, 23.0, 44.0, 29.0, 25.0, 41.0, 41.0, 30.0, 30.0, 41.0, 29.0, 31.0, 42.0, 31.0, 42.0, 25.0, 28.0, 24.0, 21.0, 14.0, 26.0, 10.0, 15.0, 11.0, 6.0, 6.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-33.46875, -32.41650390625, -31.3642578125, -30.31201171875, -29.259765625, -28.20751953125, -27.1552734375, -26.10302734375, -25.05078125, -23.99853515625, -22.9462890625, -21.89404296875, -20.841796875, -19.78955078125, -18.7373046875, -17.68505859375, -16.6328125, -15.58056640625, -14.5283203125, -13.47607421875, -12.423828125, -11.37158203125, -10.3193359375, -9.26708984375, -8.21484375, -7.16259765625, -6.1103515625, -5.05810546875, -4.005859375, -2.95361328125, -1.9013671875, -0.84912109375, 0.203125, 1.25537109375, 2.3076171875, 3.35986328125, 4.412109375, 5.46435546875, 6.5166015625, 7.56884765625, 8.62109375, 9.67333984375, 10.7255859375, 11.77783203125, 12.830078125, 13.88232421875, 14.9345703125, 15.98681640625, 17.0390625, 18.09130859375, 19.1435546875, 20.19580078125, 21.248046875, 22.30029296875, 23.3525390625, 24.40478515625, 25.45703125, 26.50927734375, 27.5615234375, 28.61376953125, 29.666015625, 30.71826171875, 31.7705078125, 32.82275390625, 33.875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 15.0, 31.0, 52.0, 91.0, 134.0, 216.0, 402.0, 586.0, 1007.0, 1586.0, 2564.0, 4071.0, 6386.0, 9980.0, 16250.0, 25408.0, 40242.0, 63500.0, 98799.0, 151581.0, 227236.0, 326761.0, 446952.0, 549747.0, 572537.0, 496073.0, 376962.0, 266616.0, 180197.0, 118743.0, 77018.0, 48851.0, 31070.0, 19543.0, 12429.0, 7715.0, 4807.0, 3134.0, 1959.0, 1176.0, 703.0, 427.0, 305.0, 177.0, 99.0, 59.0, 34.0, 24.0, 12.0, 5.0, 5.0, 2.0, 1.0, 1.0], "bins": [-44.46875, -43.1689453125, -41.869140625, -40.5693359375, -39.26953125, -37.9697265625, -36.669921875, -35.3701171875, -34.0703125, -32.7705078125, -31.470703125, -30.1708984375, -28.87109375, -27.5712890625, -26.271484375, -24.9716796875, -23.671875, -22.3720703125, -21.072265625, -19.7724609375, -18.47265625, -17.1728515625, -15.873046875, -14.5732421875, -13.2734375, -11.9736328125, -10.673828125, -9.3740234375, -8.07421875, -6.7744140625, -5.474609375, -4.1748046875, -2.875, -1.5751953125, -0.275390625, 1.0244140625, 2.32421875, 3.6240234375, 4.923828125, 6.2236328125, 7.5234375, 8.8232421875, 10.123046875, 11.4228515625, 12.72265625, 14.0224609375, 15.322265625, 16.6220703125, 17.921875, 19.2216796875, 20.521484375, 21.8212890625, 23.12109375, 24.4208984375, 25.720703125, 27.0205078125, 28.3203125, 29.6201171875, 30.919921875, 32.2197265625, 33.51953125, 34.8193359375, 36.119140625, 37.4189453125, 38.71875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 3.0, 3.0, 9.0, 16.0, 14.0, 15.0, 22.0, 29.0, 32.0, 57.0, 63.0, 90.0, 85.0, 105.0, 130.0, 135.0, 159.0, 191.0, 197.0, 218.0, 261.0, 231.0, 223.0, 214.0, 224.0, 198.0, 166.0, 144.0, 135.0, 102.0, 101.0, 88.0, 82.0, 62.0, 59.0, 38.0, 31.0, 29.0, 24.0, 19.0, 11.0, 15.0, 14.0, 9.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.125, -16.55029296875, -15.9755859375, -15.40087890625, -14.826171875, -14.25146484375, -13.6767578125, -13.10205078125, -12.52734375, -11.95263671875, -11.3779296875, -10.80322265625, -10.228515625, -9.65380859375, -9.0791015625, -8.50439453125, -7.9296875, -7.35498046875, -6.7802734375, -6.20556640625, -5.630859375, -5.05615234375, -4.4814453125, -3.90673828125, -3.33203125, -2.75732421875, -2.1826171875, -1.60791015625, -1.033203125, -0.45849609375, 0.1162109375, 0.69091796875, 1.265625, 1.84033203125, 2.4150390625, 2.98974609375, 3.564453125, 4.13916015625, 4.7138671875, 5.28857421875, 5.86328125, 6.43798828125, 7.0126953125, 7.58740234375, 8.162109375, 8.73681640625, 9.3115234375, 9.88623046875, 10.4609375, 11.03564453125, 11.6103515625, 12.18505859375, 12.759765625, 13.33447265625, 13.9091796875, 14.48388671875, 15.05859375, 15.63330078125, 16.2080078125, 16.78271484375, 17.357421875, 17.93212890625, 18.5068359375, 19.08154296875, 19.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 7.0, 10.0, 12.0, 10.0, 19.0, 17.0, 9.0, 18.0, 22.0, 34.0, 34.0, 29.0, 36.0, 36.0, 45.0, 39.0, 50.0, 34.0, 46.0, 34.0, 42.0, 57.0, 43.0, 33.0, 34.0, 35.0, 37.0, 33.0, 19.0, 30.0, 15.0, 15.0, 7.0, 9.0, 10.0, 11.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.735687255859375, -43.22833251953125, -41.72098159790039, -40.213626861572266, -38.706275939941406, -37.19892120361328, -35.691566467285156, -34.1842155456543, -32.67686462402344, -31.169511795043945, -29.662158966064453, -28.154804229736328, -26.64745330810547, -25.140098571777344, -23.63274574279785, -22.12539291381836, -20.618038177490234, -19.110685348510742, -17.60333251953125, -16.095977783203125, -14.58862590789795, -13.081273078918457, -11.573919296264648, -10.066566467285156, -8.559213638305664, -7.051860809326172, -5.5445075035095215, -4.037154197692871, -2.529801368713379, -1.0224485397338867, 0.4849052429199219, 1.992258071899414, 3.499614715576172, 5.006967544555664, 6.5143208503723145, 8.021674156188965, 9.529026985168457, 11.03637981414795, 12.543733596801758, 14.05108642578125, 15.558439254760742, 17.065792083740234, 18.573144912719727, 20.08049774169922, 21.587852478027344, 23.095203399658203, 24.602558135986328, 26.10991096496582, 27.617263793945312, 29.124616622924805, 30.631969451904297, 32.13932418823242, 33.64667510986328, 35.154029846191406, 36.66138458251953, 38.16873550415039, 39.67608642578125, 41.183441162109375, 42.690792083740234, 44.19814682006836, 45.70549774169922, 47.212852478027344, 48.72020721435547, 50.22755813598633, 51.73491287231445]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 7.0, 5.0, 11.0, 16.0, 9.0, 16.0, 15.0, 21.0, 23.0, 31.0, 18.0, 29.0, 28.0, 28.0, 25.0, 36.0, 39.0, 42.0, 36.0, 25.0, 42.0, 35.0, 45.0, 47.0, 37.0, 46.0, 29.0, 36.0, 28.0, 22.0, 30.0, 15.0, 22.0, 19.0, 21.0, 14.0, 9.0, 7.0, 6.0, 8.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.88594055175781, -40.551082611083984, -39.216224670410156, -37.88136672973633, -36.5465087890625, -35.211647033691406, -33.87678909301758, -32.54193115234375, -31.207073211669922, -29.872215270996094, -28.537357330322266, -27.202497482299805, -25.867639541625977, -24.53278160095215, -23.197921752929688, -21.86306381225586, -20.52820587158203, -19.193347930908203, -17.858489990234375, -16.523630142211914, -15.188772201538086, -13.853914260864258, -12.519055366516113, -11.184196472167969, -9.84933853149414, -8.514480590820312, -7.179621696472168, -5.844763278961182, -4.509904861450195, -3.175046443939209, -1.8401880264282227, -0.5053291320800781, 0.8295326232910156, 2.164391040802002, 3.4992494583129883, 4.834107875823975, 6.168966293334961, 7.503824710845947, 8.838683128356934, 10.173542022705078, 11.508399963378906, 12.843257904052734, 14.178116798400879, 15.512975692749023, 16.84783363342285, 18.18269157409668, 19.51755142211914, 20.85240936279297, 22.187267303466797, 23.522125244140625, 24.856983184814453, 26.191843032836914, 27.526700973510742, 28.86155891418457, 30.19641876220703, 31.53127670288086, 32.86613464355469, 34.200992584228516, 35.535850524902344, 36.87070846557617, 38.20556640625, 39.540428161621094, 40.87528610229492, 42.21014404296875, 43.54500198364258]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 12.0, 21.0, 46.0, 65.0, 89.0, 165.0, 243.0, 385.0, 594.0, 980.0, 1501.0, 2298.0, 3597.0, 5189.0, 7964.0, 12068.0, 18326.0, 26508.0, 38911.0, 55060.0, 75003.0, 96890.0, 115257.0, 122612.0, 115548.0, 97279.0, 75425.0, 55421.0, 39369.0, 27604.0, 18229.0, 12541.0, 8117.0, 5420.0, 3489.0, 2248.0, 1479.0, 973.0, 597.0, 368.0, 232.0, 148.0, 109.0, 73.0, 34.0, 19.0, 10.0, 11.0, 6.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-49.75, -48.17138671875, -46.5927734375, -45.01416015625, -43.435546875, -41.85693359375, -40.2783203125, -38.69970703125, -37.12109375, -35.54248046875, -33.9638671875, -32.38525390625, -30.806640625, -29.22802734375, -27.6494140625, -26.07080078125, -24.4921875, -22.91357421875, -21.3349609375, -19.75634765625, -18.177734375, -16.59912109375, -15.0205078125, -13.44189453125, -11.86328125, -10.28466796875, -8.7060546875, -7.12744140625, -5.548828125, -3.97021484375, -2.3916015625, -0.81298828125, 0.765625, 2.34423828125, 3.9228515625, 5.50146484375, 7.080078125, 8.65869140625, 10.2373046875, 11.81591796875, 13.39453125, 14.97314453125, 16.5517578125, 18.13037109375, 19.708984375, 21.28759765625, 22.8662109375, 24.44482421875, 26.0234375, 27.60205078125, 29.1806640625, 30.75927734375, 32.337890625, 33.91650390625, 35.4951171875, 37.07373046875, 38.65234375, 40.23095703125, 41.8095703125, 43.38818359375, 44.966796875, 46.54541015625, 48.1240234375, 49.70263671875, 51.28125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 13.0, 15.0, 23.0, 20.0, 20.0, 23.0, 30.0, 30.0, 38.0, 28.0, 28.0, 42.0, 37.0, 35.0, 31.0, 31.0, 40.0, 54.0, 32.0, 39.0, 29.0, 28.0, 42.0, 24.0, 34.0, 27.0, 31.0, 17.0, 17.0, 17.0, 15.0, 11.0, 12.0, 13.0, 6.0, 6.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-39.0625, -37.83154296875, -36.6005859375, -35.36962890625, -34.138671875, -32.90771484375, -31.6767578125, -30.44580078125, -29.21484375, -27.98388671875, -26.7529296875, -25.52197265625, -24.291015625, -23.06005859375, -21.8291015625, -20.59814453125, -19.3671875, -18.13623046875, -16.9052734375, -15.67431640625, -14.443359375, -13.21240234375, -11.9814453125, -10.75048828125, -9.51953125, -8.28857421875, -7.0576171875, -5.82666015625, -4.595703125, -3.36474609375, -2.1337890625, -0.90283203125, 0.328125, 1.55908203125, 2.7900390625, 4.02099609375, 5.251953125, 6.48291015625, 7.7138671875, 8.94482421875, 10.17578125, 11.40673828125, 12.6376953125, 13.86865234375, 15.099609375, 16.33056640625, 17.5615234375, 18.79248046875, 20.0234375, 21.25439453125, 22.4853515625, 23.71630859375, 24.947265625, 26.17822265625, 27.4091796875, 28.64013671875, 29.87109375, 31.10205078125, 32.3330078125, 33.56396484375, 34.794921875, 36.02587890625, 37.2568359375, 38.48779296875, 39.71875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 6.0, 4.0, 6.0, 26.0, 32.0, 42.0, 58.0, 92.0, 123.0, 216.0, 347.0, 567.0, 852.0, 1347.0, 2286.0, 3684.0, 6174.0, 10486.0, 18001.0, 31370.0, 55237.0, 97262.0, 161436.0, 212436.0, 180240.0, 113248.0, 64446.0, 36831.0, 20963.0, 12333.0, 7303.0, 4263.0, 2594.0, 1619.0, 942.0, 595.0, 387.0, 248.0, 172.0, 89.0, 69.0, 44.0, 40.0, 19.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.9375, -91.9365234375, -88.935546875, -85.9345703125, -82.93359375, -79.9326171875, -76.931640625, -73.9306640625, -70.9296875, -67.9287109375, -64.927734375, -61.9267578125, -58.92578125, -55.9248046875, -52.923828125, -49.9228515625, -46.921875, -43.9208984375, -40.919921875, -37.9189453125, -34.91796875, -31.9169921875, -28.916015625, -25.9150390625, -22.9140625, -19.9130859375, -16.912109375, -13.9111328125, -10.91015625, -7.9091796875, -4.908203125, -1.9072265625, 1.09375, 4.0947265625, 7.095703125, 10.0966796875, 13.09765625, 16.0986328125, 19.099609375, 22.1005859375, 25.1015625, 28.1025390625, 31.103515625, 34.1044921875, 37.10546875, 40.1064453125, 43.107421875, 46.1083984375, 49.109375, 52.1103515625, 55.111328125, 58.1123046875, 61.11328125, 64.1142578125, 67.115234375, 70.1162109375, 73.1171875, 76.1181640625, 79.119140625, 82.1201171875, 85.12109375, 88.1220703125, 91.123046875, 94.1240234375, 97.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 5.0, 6.0, 7.0, 14.0, 14.0, 11.0, 16.0, 19.0, 21.0, 30.0, 20.0, 35.0, 30.0, 39.0, 37.0, 28.0, 39.0, 33.0, 35.0, 52.0, 37.0, 26.0, 44.0, 36.0, 43.0, 31.0, 32.0, 19.0, 21.0, 36.0, 17.0, 24.0, 23.0, 18.0, 21.0, 22.0, 11.0, 5.0, 7.0, 7.0, 8.0, 0.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.484375, -27.574462890625, -26.66455078125, -25.754638671875, -24.8447265625, -23.934814453125, -23.02490234375, -22.114990234375, -21.205078125, -20.295166015625, -19.38525390625, -18.475341796875, -17.5654296875, -16.655517578125, -15.74560546875, -14.835693359375, -13.92578125, -13.015869140625, -12.10595703125, -11.196044921875, -10.2861328125, -9.376220703125, -8.46630859375, -7.556396484375, -6.646484375, -5.736572265625, -4.82666015625, -3.916748046875, -3.0068359375, -2.096923828125, -1.18701171875, -0.277099609375, 0.6328125, 1.542724609375, 2.45263671875, 3.362548828125, 4.2724609375, 5.182373046875, 6.09228515625, 7.002197265625, 7.912109375, 8.822021484375, 9.73193359375, 10.641845703125, 11.5517578125, 12.461669921875, 13.37158203125, 14.281494140625, 15.19140625, 16.101318359375, 17.01123046875, 17.921142578125, 18.8310546875, 19.740966796875, 20.65087890625, 21.560791015625, 22.470703125, 23.380615234375, 24.29052734375, 25.200439453125, 26.1103515625, 27.020263671875, 27.93017578125, 28.840087890625, 29.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 10.0, 27.0, 24.0, 38.0, 32.0, 61.0, 118.0, 151.0, 231.0, 337.0, 518.0, 790.0, 1360.0, 2033.0, 3538.0, 6297.0, 11463.0, 22830.0, 47217.0, 102316.0, 209058.0, 281411.0, 185647.0, 88017.0, 40878.0, 20021.0, 10212.0, 5461.0, 3195.0, 1902.0, 1171.0, 736.0, 472.0, 333.0, 203.0, 136.0, 97.0, 62.0, 42.0, 32.0, 30.0, 8.0, 14.0, 6.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-55.0, -53.4013671875, -51.802734375, -50.2041015625, -48.60546875, -47.0068359375, -45.408203125, -43.8095703125, -42.2109375, -40.6123046875, -39.013671875, -37.4150390625, -35.81640625, -34.2177734375, -32.619140625, -31.0205078125, -29.421875, -27.8232421875, -26.224609375, -24.6259765625, -23.02734375, -21.4287109375, -19.830078125, -18.2314453125, -16.6328125, -15.0341796875, -13.435546875, -11.8369140625, -10.23828125, -8.6396484375, -7.041015625, -5.4423828125, -3.84375, -2.2451171875, -0.646484375, 0.9521484375, 2.55078125, 4.1494140625, 5.748046875, 7.3466796875, 8.9453125, 10.5439453125, 12.142578125, 13.7412109375, 15.33984375, 16.9384765625, 18.537109375, 20.1357421875, 21.734375, 23.3330078125, 24.931640625, 26.5302734375, 28.12890625, 29.7275390625, 31.326171875, 32.9248046875, 34.5234375, 36.1220703125, 37.720703125, 39.3193359375, 40.91796875, 42.5166015625, 44.115234375, 45.7138671875, 47.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 13.0, 11.0, 14.0, 14.0, 18.0, 27.0, 27.0, 31.0, 36.0, 48.0, 51.0, 56.0, 61.0, 69.0, 61.0, 73.0, 60.0, 62.0, 37.0, 43.0, 37.0, 27.0, 26.0, 13.0, 12.0, 17.0, 11.0, 9.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.003437042236328125, -0.0033233165740966797, -0.0032095909118652344, -0.003095865249633789, -0.0029821395874023438, -0.0028684139251708984, -0.002754688262939453, -0.002640962600708008, -0.0025272369384765625, -0.002413511276245117, -0.002299785614013672, -0.0021860599517822266, -0.0020723342895507812, -0.001958608627319336, -0.0018448829650878906, -0.0017311573028564453, -0.001617431640625, -0.0015037059783935547, -0.0013899803161621094, -0.001276254653930664, -0.0011625289916992188, -0.0010488033294677734, -0.0009350776672363281, -0.0008213520050048828, -0.0007076263427734375, -0.0005939006805419922, -0.0004801750183105469, -0.00036644935607910156, -0.00025272369384765625, -0.00013899803161621094, -2.5272369384765625e-05, 8.845329284667969e-05, 0.000202178955078125, 0.0003159046173095703, 0.0004296302795410156, 0.0005433559417724609, 0.0006570816040039062, 0.0007708072662353516, 0.0008845329284667969, 0.0009982585906982422, 0.0011119842529296875, 0.0012257099151611328, 0.0013394355773925781, 0.0014531612396240234, 0.0015668869018554688, 0.001680612564086914, 0.0017943382263183594, 0.0019080638885498047, 0.00202178955078125, 0.0021355152130126953, 0.0022492408752441406, 0.002362966537475586, 0.0024766921997070312, 0.0025904178619384766, 0.002704143524169922, 0.002817869186401367, 0.0029315948486328125, 0.003045320510864258, 0.003159046173095703, 0.0032727718353271484, 0.0033864974975585938, 0.003500223159790039, 0.0036139488220214844, 0.0037276744842529297, 0.003841400146484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 11.0, 10.0, 11.0, 10.0, 22.0, 26.0, 37.0, 50.0, 86.0, 92.0, 177.0, 263.0, 441.0, 677.0, 991.0, 1523.0, 2475.0, 4184.0, 6557.0, 11163.0, 18536.0, 31886.0, 55422.0, 95045.0, 148518.0, 189540.0, 175980.0, 123741.0, 74909.0, 42997.0, 25166.0, 14805.0, 8858.0, 5342.0, 3251.0, 2080.0, 1289.0, 830.0, 537.0, 327.0, 213.0, 151.0, 95.0, 68.0, 53.0, 31.0, 23.0, 26.0, 12.0, 11.0, 4.0, 1.0, 6.0, 4.0, 1.0, 1.0, 2.0], "bins": [-48.78125, -47.29296875, -45.8046875, -44.31640625, -42.828125, -41.33984375, -39.8515625, -38.36328125, -36.875, -35.38671875, -33.8984375, -32.41015625, -30.921875, -29.43359375, -27.9453125, -26.45703125, -24.96875, -23.48046875, -21.9921875, -20.50390625, -19.015625, -17.52734375, -16.0390625, -14.55078125, -13.0625, -11.57421875, -10.0859375, -8.59765625, -7.109375, -5.62109375, -4.1328125, -2.64453125, -1.15625, 0.33203125, 1.8203125, 3.30859375, 4.796875, 6.28515625, 7.7734375, 9.26171875, 10.75, 12.23828125, 13.7265625, 15.21484375, 16.703125, 18.19140625, 19.6796875, 21.16796875, 22.65625, 24.14453125, 25.6328125, 27.12109375, 28.609375, 30.09765625, 31.5859375, 33.07421875, 34.5625, 36.05078125, 37.5390625, 39.02734375, 40.515625, 42.00390625, 43.4921875, 44.98046875, 46.46875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 6.0, 10.0, 4.0, 5.0, 9.0, 9.0, 11.0, 20.0, 22.0, 24.0, 30.0, 38.0, 32.0, 43.0, 54.0, 44.0, 54.0, 48.0, 57.0, 45.0, 51.0, 48.0, 57.0, 32.0, 41.0, 50.0, 18.0, 30.0, 21.0, 10.0, 15.0, 12.0, 8.0, 11.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-18.03125, -17.527099609375, -17.02294921875, -16.518798828125, -16.0146484375, -15.510498046875, -15.00634765625, -14.502197265625, -13.998046875, -13.493896484375, -12.98974609375, -12.485595703125, -11.9814453125, -11.477294921875, -10.97314453125, -10.468994140625, -9.96484375, -9.460693359375, -8.95654296875, -8.452392578125, -7.9482421875, -7.444091796875, -6.93994140625, -6.435791015625, -5.931640625, -5.427490234375, -4.92333984375, -4.419189453125, -3.9150390625, -3.410888671875, -2.90673828125, -2.402587890625, -1.8984375, -1.394287109375, -0.89013671875, -0.385986328125, 0.1181640625, 0.622314453125, 1.12646484375, 1.630615234375, 2.134765625, 2.638916015625, 3.14306640625, 3.647216796875, 4.1513671875, 4.655517578125, 5.15966796875, 5.663818359375, 6.16796875, 6.672119140625, 7.17626953125, 7.680419921875, 8.1845703125, 8.688720703125, 9.19287109375, 9.697021484375, 10.201171875, 10.705322265625, 11.20947265625, 11.713623046875, 12.2177734375, 12.721923828125, 13.22607421875, 13.730224609375, 14.234375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 6.0, 4.0, 6.0, 15.0, 8.0, 16.0, 21.0, 23.0, 30.0, 32.0, 25.0, 37.0, 46.0, 44.0, 40.0, 44.0, 43.0, 40.0, 39.0, 50.0, 40.0, 48.0, 45.0, 30.0, 32.0, 39.0, 34.0, 27.0, 15.0, 22.0, 16.0, 13.0, 18.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.12483596801758, -44.69575500488281, -43.26667785644531, -41.83759689331055, -40.40851593017578, -38.979434967041016, -37.55035400390625, -36.12127685546875, -34.692195892333984, -33.26311492919922, -31.834035873413086, -30.404956817626953, -28.975875854492188, -27.546794891357422, -26.11771583557129, -24.688636779785156, -23.25955581665039, -21.830474853515625, -20.401395797729492, -18.97231674194336, -17.543235778808594, -16.114154815673828, -14.685075759887695, -13.255995750427246, -11.826915740966797, -10.397835731506348, -8.968755722045898, -7.539675712585449, -6.110595703125, -4.681515693664551, -3.2524356842041016, -1.8233556747436523, -0.3942756652832031, 1.034804344177246, 2.4638843536376953, 3.8929643630981445, 5.322044372558594, 6.751124382019043, 8.180204391479492, 9.609284400939941, 11.03836441040039, 12.46744441986084, 13.896524429321289, 15.325604438781738, 16.754684448242188, 18.183765411376953, 19.612844467163086, 21.04192352294922, 22.471004486083984, 23.90008544921875, 25.329164505004883, 26.758243560791016, 28.18732452392578, 29.616405487060547, 31.04548454284668, 32.47456359863281, 33.90364456176758, 35.332725524902344, 36.761802673339844, 38.19088363647461, 39.619964599609375, 41.04904556274414, 42.478126525878906, 43.907203674316406, 45.33628463745117]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 6.0, 7.0, 6.0, 9.0, 7.0, 17.0, 17.0, 25.0, 18.0, 18.0, 32.0, 28.0, 32.0, 32.0, 23.0, 33.0, 49.0, 42.0, 53.0, 40.0, 43.0, 49.0, 38.0, 48.0, 39.0, 36.0, 31.0, 32.0, 30.0, 28.0, 26.0, 16.0, 16.0, 16.0, 9.0, 14.0, 12.0, 14.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-46.6157341003418, -45.24986267089844, -43.883995056152344, -42.518123626708984, -41.15225601196289, -39.78638458251953, -38.42051696777344, -37.05464553833008, -35.68877410888672, -34.32290267944336, -32.957035064697266, -31.591163635253906, -30.225296020507812, -28.859424591064453, -27.493555068969727, -26.127685546875, -24.761817932128906, -23.39594841003418, -22.030078887939453, -20.664207458496094, -19.29833984375, -17.93246841430664, -16.566598892211914, -15.200729370117188, -13.834859848022461, -12.468990325927734, -11.103120803833008, -9.737250328063965, -8.371380805969238, -7.005511283874512, -5.639640808105469, -4.273771286010742, -2.9079017639160156, -1.54203200340271, -0.1761622428894043, 1.1897077560424805, 2.555577278137207, 3.9214468002319336, 5.287317276000977, 6.653186798095703, 8.01905632019043, 9.384925842285156, 10.750795364379883, 12.116665840148926, 13.482535362243652, 14.848404884338379, 16.214275360107422, 17.58014488220215, 18.946014404296875, 20.3118839263916, 21.677753448486328, 23.043624877929688, 24.40949249267578, 25.77536392211914, 27.141233444213867, 28.507102966308594, 29.87297248840332, 31.238842010498047, 32.604713439941406, 33.9705810546875, 35.33645248413086, 36.70232009887695, 38.06819152832031, 39.434059143066406, 40.799930572509766]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 15.0, 21.0, 25.0, 33.0, 71.0, 119.0, 151.0, 267.0, 400.0, 661.0, 950.0, 1601.0, 2401.0, 3778.0, 5804.0, 8618.0, 12979.0, 18839.0, 26613.0, 36642.0, 48376.0, 61852.0, 75271.0, 87101.0, 95008.0, 97186.0, 93409.0, 85003.0, 71995.0, 58255.0, 45051.0, 33737.0, 24487.0, 17353.0, 11813.0, 7891.0, 5201.0, 3439.0, 2224.0, 1404.0, 919.0, 612.0, 362.0, 228.0, 155.0, 83.0, 60.0, 41.0, 21.0, 14.0, 9.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.15625, -31.1630859375, -30.169921875, -29.1767578125, -28.18359375, -27.1904296875, -26.197265625, -25.2041015625, -24.2109375, -23.2177734375, -22.224609375, -21.2314453125, -20.23828125, -19.2451171875, -18.251953125, -17.2587890625, -16.265625, -15.2724609375, -14.279296875, -13.2861328125, -12.29296875, -11.2998046875, -10.306640625, -9.3134765625, -8.3203125, -7.3271484375, -6.333984375, -5.3408203125, -4.34765625, -3.3544921875, -2.361328125, -1.3681640625, -0.375, 0.6181640625, 1.611328125, 2.6044921875, 3.59765625, 4.5908203125, 5.583984375, 6.5771484375, 7.5703125, 8.5634765625, 9.556640625, 10.5498046875, 11.54296875, 12.5361328125, 13.529296875, 14.5224609375, 15.515625, 16.5087890625, 17.501953125, 18.4951171875, 19.48828125, 20.4814453125, 21.474609375, 22.4677734375, 23.4609375, 24.4541015625, 25.447265625, 26.4404296875, 27.43359375, 28.4267578125, 29.419921875, 30.4130859375, 31.40625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 8.0, 11.0, 13.0, 12.0, 17.0, 17.0, 20.0, 20.0, 23.0, 24.0, 27.0, 29.0, 28.0, 14.0, 45.0, 40.0, 44.0, 51.0, 46.0, 37.0, 43.0, 49.0, 43.0, 35.0, 29.0, 30.0, 36.0, 32.0, 18.0, 32.0, 23.0, 19.0, 14.0, 10.0, 12.0, 8.0, 7.0, 13.0, 4.0, 9.0, 2.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.28125, -43.9560546875, -42.630859375, -41.3056640625, -39.98046875, -38.6552734375, -37.330078125, -36.0048828125, -34.6796875, -33.3544921875, -32.029296875, -30.7041015625, -29.37890625, -28.0537109375, -26.728515625, -25.4033203125, -24.078125, -22.7529296875, -21.427734375, -20.1025390625, -18.77734375, -17.4521484375, -16.126953125, -14.8017578125, -13.4765625, -12.1513671875, -10.826171875, -9.5009765625, -8.17578125, -6.8505859375, -5.525390625, -4.2001953125, -2.875, -1.5498046875, -0.224609375, 1.1005859375, 2.42578125, 3.7509765625, 5.076171875, 6.4013671875, 7.7265625, 9.0517578125, 10.376953125, 11.7021484375, 13.02734375, 14.3525390625, 15.677734375, 17.0029296875, 18.328125, 19.6533203125, 20.978515625, 22.3037109375, 23.62890625, 24.9541015625, 26.279296875, 27.6044921875, 28.9296875, 30.2548828125, 31.580078125, 32.9052734375, 34.23046875, 35.5556640625, 36.880859375, 38.2060546875, 39.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 4.0, 8.0, 17.0, 27.0, 38.0, 69.0, 96.0, 151.0, 250.0, 378.0, 654.0, 959.0, 1404.0, 2202.0, 3226.0, 4831.0, 7241.0, 10437.0, 14701.0, 20613.0, 28701.0, 38952.0, 50582.0, 63513.0, 76727.0, 87438.0, 93176.0, 95148.0, 90099.0, 80182.0, 68313.0, 55750.0, 42941.0, 32448.0, 23769.0, 16874.0, 11871.0, 8281.0, 5417.0, 3740.0, 2533.0, 1695.0, 1125.0, 708.0, 442.0, 343.0, 198.0, 120.0, 65.0, 41.0, 27.0, 13.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-34.59375, -33.44775390625, -32.3017578125, -31.15576171875, -30.009765625, -28.86376953125, -27.7177734375, -26.57177734375, -25.42578125, -24.27978515625, -23.1337890625, -21.98779296875, -20.841796875, -19.69580078125, -18.5498046875, -17.40380859375, -16.2578125, -15.11181640625, -13.9658203125, -12.81982421875, -11.673828125, -10.52783203125, -9.3818359375, -8.23583984375, -7.08984375, -5.94384765625, -4.7978515625, -3.65185546875, -2.505859375, -1.35986328125, -0.2138671875, 0.93212890625, 2.078125, 3.22412109375, 4.3701171875, 5.51611328125, 6.662109375, 7.80810546875, 8.9541015625, 10.10009765625, 11.24609375, 12.39208984375, 13.5380859375, 14.68408203125, 15.830078125, 16.97607421875, 18.1220703125, 19.26806640625, 20.4140625, 21.56005859375, 22.7060546875, 23.85205078125, 24.998046875, 26.14404296875, 27.2900390625, 28.43603515625, 29.58203125, 30.72802734375, 31.8740234375, 33.02001953125, 34.166015625, 35.31201171875, 36.4580078125, 37.60400390625, 38.75]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 8.0, 2.0, 7.0, 3.0, 13.0, 9.0, 8.0, 16.0, 13.0, 22.0, 22.0, 21.0, 24.0, 28.0, 30.0, 30.0, 35.0, 46.0, 40.0, 25.0, 29.0, 50.0, 51.0, 44.0, 53.0, 31.0, 39.0, 33.0, 46.0, 24.0, 24.0, 22.0, 24.0, 24.0, 22.0, 18.0, 15.0, 14.0, 6.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-33.375, -32.478271484375, -31.58154296875, -30.684814453125, -29.7880859375, -28.891357421875, -27.99462890625, -27.097900390625, -26.201171875, -25.304443359375, -24.40771484375, -23.510986328125, -22.6142578125, -21.717529296875, -20.82080078125, -19.924072265625, -19.02734375, -18.130615234375, -17.23388671875, -16.337158203125, -15.4404296875, -14.543701171875, -13.64697265625, -12.750244140625, -11.853515625, -10.956787109375, -10.06005859375, -9.163330078125, -8.2666015625, -7.369873046875, -6.47314453125, -5.576416015625, -4.6796875, -3.782958984375, -2.88623046875, -1.989501953125, -1.0927734375, -0.196044921875, 0.70068359375, 1.597412109375, 2.494140625, 3.390869140625, 4.28759765625, 5.184326171875, 6.0810546875, 6.977783203125, 7.87451171875, 8.771240234375, 9.66796875, 10.564697265625, 11.46142578125, 12.358154296875, 13.2548828125, 14.151611328125, 15.04833984375, 15.945068359375, 16.841796875, 17.738525390625, 18.63525390625, 19.531982421875, 20.4287109375, 21.325439453125, 22.22216796875, 23.118896484375, 24.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 13.0, 17.0, 26.0, 34.0, 72.0, 104.0, 171.0, 256.0, 342.0, 541.0, 827.0, 1351.0, 2034.0, 3337.0, 5252.0, 8327.0, 13072.0, 20199.0, 31060.0, 45747.0, 65613.0, 87161.0, 107070.0, 120321.0, 120986.0, 110523.0, 90793.0, 69289.0, 49288.0, 33620.0, 22026.0, 14302.0, 9084.0, 5814.0, 3587.0, 2284.0, 1483.0, 926.0, 551.0, 353.0, 241.0, 140.0, 104.0, 68.0, 46.0, 35.0, 24.0, 16.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.3203125, -12.9052734375, -12.490234375, -12.0751953125, -11.66015625, -11.2451171875, -10.830078125, -10.4150390625, -10.0, -9.5849609375, -9.169921875, -8.7548828125, -8.33984375, -7.9248046875, -7.509765625, -7.0947265625, -6.6796875, -6.2646484375, -5.849609375, -5.4345703125, -5.01953125, -4.6044921875, -4.189453125, -3.7744140625, -3.359375, -2.9443359375, -2.529296875, -2.1142578125, -1.69921875, -1.2841796875, -0.869140625, -0.4541015625, -0.0390625, 0.3759765625, 0.791015625, 1.2060546875, 1.62109375, 2.0361328125, 2.451171875, 2.8662109375, 3.28125, 3.6962890625, 4.111328125, 4.5263671875, 4.94140625, 5.3564453125, 5.771484375, 6.1865234375, 6.6015625, 7.0166015625, 7.431640625, 7.8466796875, 8.26171875, 8.6767578125, 9.091796875, 9.5068359375, 9.921875, 10.3369140625, 10.751953125, 11.1669921875, 11.58203125, 11.9970703125, 12.412109375, 12.8271484375, 13.2421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 11.0, 5.0, 6.0, 11.0, 12.0, 26.0, 23.0, 36.0, 38.0, 43.0, 50.0, 52.0, 52.0, 63.0, 63.0, 63.0, 70.0, 51.0, 59.0, 51.0, 39.0, 30.0, 35.0, 17.0, 18.0, 14.0, 16.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020351409912109375, -0.0019670426845550537, -0.00189894437789917, -0.0018308460712432861, -0.0017627477645874023, -0.0016946494579315186, -0.0016265511512756348, -0.001558452844619751, -0.0014903545379638672, -0.0014222562313079834, -0.0013541579246520996, -0.0012860596179962158, -0.001217961311340332, -0.0011498630046844482, -0.0010817646980285645, -0.0010136663913726807, -0.0009455680847167969, -0.0008774697780609131, -0.0008093714714050293, -0.0007412731647491455, -0.0006731748580932617, -0.0006050765514373779, -0.0005369782447814941, -0.00046887993812561035, -0.00040078163146972656, -0.0003326833248138428, -0.000264585018157959, -0.0001964867115020752, -0.0001283884048461914, -6.029009819030762e-05, 7.808208465576172e-06, 7.590651512145996e-05, 0.00014400482177734375, 0.00021210312843322754, 0.00028020143508911133, 0.0003482997417449951, 0.0004163980484008789, 0.0004844963550567627, 0.0005525946617126465, 0.0006206929683685303, 0.0006887912750244141, 0.0007568895816802979, 0.0008249878883361816, 0.0008930861949920654, 0.0009611845016479492, 0.001029282808303833, 0.0010973811149597168, 0.0011654794216156006, 0.0012335777282714844, 0.0013016760349273682, 0.001369774341583252, 0.0014378726482391357, 0.0015059709548950195, 0.0015740692615509033, 0.0016421675682067871, 0.001710265874862671, 0.0017783641815185547, 0.0018464624881744385, 0.0019145607948303223, 0.001982659101486206, 0.00205075740814209, 0.0021188557147979736, 0.0021869540214538574, 0.002255052328109741, 0.002323150634765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 7.0, 7.0, 12.0, 17.0, 23.0, 46.0, 61.0, 108.0, 140.0, 240.0, 346.0, 508.0, 862.0, 1320.0, 2022.0, 3352.0, 5280.0, 8755.0, 13878.0, 21283.0, 32484.0, 48107.0, 66730.0, 87568.0, 107845.0, 119170.0, 119452.0, 107581.0, 89966.0, 68389.0, 49154.0, 33283.0, 22209.0, 14162.0, 9043.0, 5683.0, 3449.0, 2197.0, 1361.0, 878.0, 561.0, 352.0, 203.0, 159.0, 113.0, 77.0, 34.0, 36.0, 14.0, 13.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-13.3671875, -12.949951171875, -12.53271484375, -12.115478515625, -11.6982421875, -11.281005859375, -10.86376953125, -10.446533203125, -10.029296875, -9.612060546875, -9.19482421875, -8.777587890625, -8.3603515625, -7.943115234375, -7.52587890625, -7.108642578125, -6.69140625, -6.274169921875, -5.85693359375, -5.439697265625, -5.0224609375, -4.605224609375, -4.18798828125, -3.770751953125, -3.353515625, -2.936279296875, -2.51904296875, -2.101806640625, -1.6845703125, -1.267333984375, -0.85009765625, -0.432861328125, -0.015625, 0.401611328125, 0.81884765625, 1.236083984375, 1.6533203125, 2.070556640625, 2.48779296875, 2.905029296875, 3.322265625, 3.739501953125, 4.15673828125, 4.573974609375, 4.9912109375, 5.408447265625, 5.82568359375, 6.242919921875, 6.66015625, 7.077392578125, 7.49462890625, 7.911865234375, 8.3291015625, 8.746337890625, 9.16357421875, 9.580810546875, 9.998046875, 10.415283203125, 10.83251953125, 11.249755859375, 11.6669921875, 12.084228515625, 12.50146484375, 12.918701171875, 13.3359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 6.0, 8.0, 11.0, 11.0, 16.0, 22.0, 23.0, 15.0, 27.0, 34.0, 40.0, 51.0, 50.0, 44.0, 60.0, 53.0, 47.0, 56.0, 58.0, 42.0, 42.0, 38.0, 43.0, 30.0, 25.0, 22.0, 17.0, 19.0, 9.0, 15.0, 15.0, 12.0, 9.0, 5.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2109375, -6.01531982421875, -5.8197021484375, -5.62408447265625, -5.428466796875, -5.23284912109375, -5.0372314453125, -4.84161376953125, -4.64599609375, -4.45037841796875, -4.2547607421875, -4.05914306640625, -3.863525390625, -3.66790771484375, -3.4722900390625, -3.27667236328125, -3.0810546875, -2.88543701171875, -2.6898193359375, -2.49420166015625, -2.298583984375, -2.10296630859375, -1.9073486328125, -1.71173095703125, -1.51611328125, -1.32049560546875, -1.1248779296875, -0.92926025390625, -0.733642578125, -0.53802490234375, -0.3424072265625, -0.14678955078125, 0.048828125, 0.24444580078125, 0.4400634765625, 0.63568115234375, 0.831298828125, 1.02691650390625, 1.2225341796875, 1.41815185546875, 1.61376953125, 1.80938720703125, 2.0050048828125, 2.20062255859375, 2.396240234375, 2.59185791015625, 2.7874755859375, 2.98309326171875, 3.1787109375, 3.37432861328125, 3.5699462890625, 3.76556396484375, 3.961181640625, 4.15679931640625, 4.3524169921875, 4.54803466796875, 4.74365234375, 4.93927001953125, 5.1348876953125, 5.33050537109375, 5.526123046875, 5.72174072265625, 5.9173583984375, 6.11297607421875, 6.30859375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 7.0, 8.0, 6.0, 8.0, 12.0, 16.0, 18.0, 22.0, 20.0, 29.0, 29.0, 29.0, 34.0, 37.0, 31.0, 47.0, 42.0, 47.0, 36.0, 40.0, 39.0, 44.0, 50.0, 38.0, 35.0, 38.0, 36.0, 27.0, 27.0, 28.0, 22.0, 15.0, 8.0, 11.0, 5.0, 11.0, 13.0, 5.0, 10.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.402565002441406, -40.03293991088867, -38.66331481933594, -37.29368591308594, -35.9240608215332, -34.55443572998047, -33.18480682373047, -31.815181732177734, -30.445556640625, -29.075931549072266, -27.7063045501709, -26.33667755126953, -24.967052459716797, -23.597427368164062, -22.227800369262695, -20.858173370361328, -19.488548278808594, -18.11892318725586, -16.749296188354492, -15.379670143127441, -14.01004409790039, -12.64041805267334, -11.270792007446289, -9.901165962219238, -8.531539916992188, -7.161913871765137, -5.792287826538086, -4.422661781311035, -3.0530357360839844, -1.6834096908569336, -0.3137836456298828, 1.055842399597168, 2.4254684448242188, 3.7950944900512695, 5.16472053527832, 6.534346580505371, 7.903972625732422, 9.273598670959473, 10.643224716186523, 12.012850761413574, 13.382476806640625, 14.752102851867676, 16.121728897094727, 17.491355895996094, 18.860980987548828, 20.230606079101562, 21.60023307800293, 22.969860076904297, 24.33948516845703, 25.709110260009766, 27.078737258911133, 28.4483642578125, 29.817989349365234, 31.18761444091797, 32.55724334716797, 33.9268684387207, 35.29649353027344, 36.66611862182617, 38.035743713378906, 39.405372619628906, 40.77499771118164, 42.144622802734375, 43.514251708984375, 44.88387680053711, 46.253501892089844]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 4.0, 8.0, 9.0, 12.0, 5.0, 8.0, 13.0, 15.0, 18.0, 28.0, 24.0, 21.0, 25.0, 26.0, 35.0, 32.0, 29.0, 29.0, 42.0, 33.0, 38.0, 35.0, 36.0, 45.0, 31.0, 41.0, 26.0, 37.0, 47.0, 24.0, 20.0, 16.0, 22.0, 17.0, 25.0, 24.0, 14.0, 20.0, 21.0, 12.0, 16.0, 8.0, 3.0, 3.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.50913619995117, -37.23678207397461, -35.96442794799805, -34.69207763671875, -33.41972351074219, -32.147369384765625, -30.875015258789062, -29.6026611328125, -28.33030891418457, -27.057954788208008, -25.785602569580078, -24.513248443603516, -23.240894317626953, -21.968542098999023, -20.69618797302246, -19.42383575439453, -18.15148162841797, -16.879127502441406, -15.606775283813477, -14.334421157836914, -13.062067985534668, -11.789714813232422, -10.51736068725586, -9.245007514953613, -7.972654342651367, -6.700301170349121, -5.427947521209717, -4.1555938720703125, -2.8832406997680664, -1.6108875274658203, -0.338533878326416, 0.9338197708129883, 2.2061729431152344, 3.4785263538360596, 4.750879764556885, 6.023233413696289, 7.295586585998535, 8.567939758300781, 9.840293884277344, 11.11264705657959, 12.385000228881836, 13.657353401184082, 14.929706573486328, 16.20206069946289, 17.474414825439453, 18.746767044067383, 20.019121170043945, 21.291473388671875, 22.563827514648438, 23.836181640625, 25.10853385925293, 26.380887985229492, 27.653240203857422, 28.925594329833984, 30.197948455810547, 31.47030258178711, 32.742652893066406, 34.01500701904297, 35.28736114501953, 36.55971145629883, 37.83206558227539, 39.10441970825195, 40.376773834228516, 41.64912796020508, 42.92148208618164]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 10.0, 20.0, 33.0, 43.0, 70.0, 136.0, 218.0, 370.0, 646.0, 1143.0, 1959.0, 3337.0, 5799.0, 9902.0, 16897.0, 29108.0, 50645.0, 88685.0, 153649.0, 266462.0, 440401.0, 644543.0, 748397.0, 649137.0, 446081.0, 269300.0, 155793.0, 89312.0, 51183.0, 29522.0, 17052.0, 9918.0, 5848.0, 3527.0, 2072.0, 1250.0, 725.0, 427.0, 269.0, 166.0, 83.0, 48.0, 29.0, 21.0, 16.0, 12.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.21875, -44.751953125, -43.28515625, -41.818359375, -40.3515625, -38.884765625, -37.41796875, -35.951171875, -34.484375, -33.017578125, -31.55078125, -30.083984375, -28.6171875, -27.150390625, -25.68359375, -24.216796875, -22.75, -21.283203125, -19.81640625, -18.349609375, -16.8828125, -15.416015625, -13.94921875, -12.482421875, -11.015625, -9.548828125, -8.08203125, -6.615234375, -5.1484375, -3.681640625, -2.21484375, -0.748046875, 0.71875, 2.185546875, 3.65234375, 5.119140625, 6.5859375, 8.052734375, 9.51953125, 10.986328125, 12.453125, 13.919921875, 15.38671875, 16.853515625, 18.3203125, 19.787109375, 21.25390625, 22.720703125, 24.1875, 25.654296875, 27.12109375, 28.587890625, 30.0546875, 31.521484375, 32.98828125, 34.455078125, 35.921875, 37.388671875, 38.85546875, 40.322265625, 41.7890625, 43.255859375, 44.72265625, 46.189453125, 47.65625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 8.0, 4.0, 9.0, 15.0, 9.0, 15.0, 19.0, 19.0, 26.0, 31.0, 19.0, 33.0, 26.0, 42.0, 25.0, 25.0, 37.0, 28.0, 41.0, 26.0, 45.0, 36.0, 45.0, 34.0, 31.0, 27.0, 31.0, 25.0, 35.0, 30.0, 23.0, 23.0, 21.0, 28.0, 11.0, 21.0, 14.0, 15.0, 13.0, 12.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.984375, -30.938232421875, -29.89208984375, -28.845947265625, -27.7998046875, -26.753662109375, -25.70751953125, -24.661376953125, -23.615234375, -22.569091796875, -21.52294921875, -20.476806640625, -19.4306640625, -18.384521484375, -17.33837890625, -16.292236328125, -15.24609375, -14.199951171875, -13.15380859375, -12.107666015625, -11.0615234375, -10.015380859375, -8.96923828125, -7.923095703125, -6.876953125, -5.830810546875, -4.78466796875, -3.738525390625, -2.6923828125, -1.646240234375, -0.60009765625, 0.446044921875, 1.4921875, 2.538330078125, 3.58447265625, 4.630615234375, 5.6767578125, 6.722900390625, 7.76904296875, 8.815185546875, 9.861328125, 10.907470703125, 11.95361328125, 12.999755859375, 14.0458984375, 15.092041015625, 16.13818359375, 17.184326171875, 18.23046875, 19.276611328125, 20.32275390625, 21.368896484375, 22.4150390625, 23.461181640625, 24.50732421875, 25.553466796875, 26.599609375, 27.645751953125, 28.69189453125, 29.738037109375, 30.7841796875, 31.830322265625, 32.87646484375, 33.922607421875, 34.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 4.0, 13.0, 26.0, 52.0, 60.0, 95.0, 130.0, 227.0, 392.0, 577.0, 996.0, 1525.0, 2539.0, 4137.0, 6642.0, 10864.0, 17673.0, 28992.0, 46956.0, 74857.0, 120429.0, 187498.0, 283549.0, 405363.0, 532817.0, 597306.0, 555694.0, 438641.0, 311419.0, 209106.0, 134074.0, 84761.0, 52311.0, 32424.0, 20147.0, 12318.0, 7533.0, 4723.0, 2839.0, 1756.0, 1092.0, 680.0, 400.0, 228.0, 145.0, 84.0, 61.0, 51.0, 24.0, 19.0, 11.0, 12.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-34.65625, -33.486328125, -32.31640625, -31.146484375, -29.9765625, -28.806640625, -27.63671875, -26.466796875, -25.296875, -24.126953125, -22.95703125, -21.787109375, -20.6171875, -19.447265625, -18.27734375, -17.107421875, -15.9375, -14.767578125, -13.59765625, -12.427734375, -11.2578125, -10.087890625, -8.91796875, -7.748046875, -6.578125, -5.408203125, -4.23828125, -3.068359375, -1.8984375, -0.728515625, 0.44140625, 1.611328125, 2.78125, 3.951171875, 5.12109375, 6.291015625, 7.4609375, 8.630859375, 9.80078125, 10.970703125, 12.140625, 13.310546875, 14.48046875, 15.650390625, 16.8203125, 17.990234375, 19.16015625, 20.330078125, 21.5, 22.669921875, 23.83984375, 25.009765625, 26.1796875, 27.349609375, 28.51953125, 29.689453125, 30.859375, 32.029296875, 33.19921875, 34.369140625, 35.5390625, 36.708984375, 37.87890625, 39.048828125, 40.21875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 6.0, 6.0, 2.0, 9.0, 6.0, 16.0, 13.0, 16.0, 20.0, 29.0, 35.0, 44.0, 47.0, 45.0, 68.0, 69.0, 78.0, 98.0, 99.0, 130.0, 138.0, 144.0, 164.0, 172.0, 199.0, 184.0, 209.0, 229.0, 217.0, 186.0, 171.0, 159.0, 155.0, 141.0, 128.0, 101.0, 101.0, 79.0, 65.0, 60.0, 43.0, 51.0, 41.0, 29.0, 12.0, 19.0, 12.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0], "bins": [-14.9375, -14.4820556640625, -14.026611328125, -13.5711669921875, -13.11572265625, -12.6602783203125, -12.204833984375, -11.7493896484375, -11.2939453125, -10.8385009765625, -10.383056640625, -9.9276123046875, -9.47216796875, -9.0167236328125, -8.561279296875, -8.1058349609375, -7.650390625, -7.1949462890625, -6.739501953125, -6.2840576171875, -5.82861328125, -5.3731689453125, -4.917724609375, -4.4622802734375, -4.0068359375, -3.5513916015625, -3.095947265625, -2.6405029296875, -2.18505859375, -1.7296142578125, -1.274169921875, -0.8187255859375, -0.36328125, 0.0921630859375, 0.547607421875, 1.0030517578125, 1.45849609375, 1.9139404296875, 2.369384765625, 2.8248291015625, 3.2802734375, 3.7357177734375, 4.191162109375, 4.6466064453125, 5.10205078125, 5.5574951171875, 6.012939453125, 6.4683837890625, 6.923828125, 7.3792724609375, 7.834716796875, 8.2901611328125, 8.74560546875, 9.2010498046875, 9.656494140625, 10.1119384765625, 10.5673828125, 11.0228271484375, 11.478271484375, 11.9337158203125, 12.38916015625, 12.8446044921875, 13.300048828125, 13.7554931640625, 14.2109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 6.0, 7.0, 3.0, 9.0, 11.0, 12.0, 14.0, 14.0, 23.0, 16.0, 18.0, 34.0, 41.0, 31.0, 45.0, 44.0, 36.0, 41.0, 38.0, 46.0, 52.0, 51.0, 55.0, 47.0, 36.0, 28.0, 51.0, 23.0, 26.0, 27.0, 24.0, 16.0, 16.0, 8.0, 11.0, 9.0, 8.0, 6.0, 7.0, 7.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.242271423339844, -43.82782745361328, -42.41338348388672, -40.998939514160156, -39.584495544433594, -38.17005157470703, -36.75560760498047, -35.341163635253906, -33.926719665527344, -32.51227569580078, -31.09783172607422, -29.683387756347656, -28.268943786621094, -26.85449981689453, -25.44005584716797, -24.025611877441406, -22.611167907714844, -21.19672393798828, -19.78227996826172, -18.367835998535156, -16.953392028808594, -15.538948059082031, -14.124504089355469, -12.710060119628906, -11.295616149902344, -9.881172180175781, -8.466728210449219, -7.052284240722656, -5.637840270996094, -4.223396301269531, -2.8089523315429688, -1.3945083618164062, 0.01993560791015625, 1.4343795776367188, 2.8488235473632812, 4.263267517089844, 5.677711486816406, 7.092155456542969, 8.506599426269531, 9.921043395996094, 11.335487365722656, 12.749931335449219, 14.164375305175781, 15.578819274902344, 16.993263244628906, 18.40770721435547, 19.82215118408203, 21.236595153808594, 22.651039123535156, 24.06548309326172, 25.47992706298828, 26.894371032714844, 28.308815002441406, 29.72325897216797, 31.13770294189453, 32.552146911621094, 33.966590881347656, 35.38103485107422, 36.79547882080078, 38.209922790527344, 39.624366760253906, 41.03881072998047, 42.45325469970703, 43.867698669433594, 45.282142639160156]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 7.0, 9.0, 10.0, 10.0, 12.0, 13.0, 17.0, 21.0, 13.0, 22.0, 30.0, 26.0, 32.0, 39.0, 31.0, 43.0, 54.0, 39.0, 31.0, 39.0, 41.0, 37.0, 46.0, 41.0, 22.0, 30.0, 34.0, 30.0, 38.0, 25.0, 30.0, 18.0, 14.0, 15.0, 19.0, 8.0, 13.0, 5.0, 13.0, 9.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.3831672668457, -38.076507568359375, -36.76984405517578, -35.46318054199219, -34.15652084350586, -32.84986114501953, -31.543197631835938, -30.236536026000977, -28.929874420166016, -27.623212814331055, -26.316551208496094, -25.009889602661133, -23.703227996826172, -22.39656639099121, -21.08990478515625, -19.78324317932129, -18.476581573486328, -17.169919967651367, -15.863258361816406, -14.556596755981445, -13.249935150146484, -11.943273544311523, -10.636611938476562, -9.329950332641602, -8.02328872680664, -6.71662712097168, -5.409965515136719, -4.103303909301758, -2.796642303466797, -1.489980697631836, -0.183319091796875, 1.123342514038086, 2.4300003051757812, 3.736661911010742, 5.043323516845703, 6.349985122680664, 7.656646728515625, 8.963308334350586, 10.269969940185547, 11.576631546020508, 12.883293151855469, 14.18995475769043, 15.49661636352539, 16.80327796936035, 18.109939575195312, 19.416601181030273, 20.723262786865234, 22.029924392700195, 23.336585998535156, 24.643247604370117, 25.949909210205078, 27.25657081604004, 28.563232421875, 29.86989402770996, 31.176555633544922, 32.48321533203125, 33.789878845214844, 35.09654235839844, 36.403202056884766, 37.709861755371094, 39.01652526855469, 40.32318878173828, 41.62984848022461, 42.93650817871094, 44.24317169189453]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 16.0, 14.0, 23.0, 42.0, 57.0, 131.0, 177.0, 271.0, 433.0, 637.0, 1075.0, 1546.0, 2571.0, 3914.0, 6004.0, 9421.0, 14349.0, 21475.0, 30636.0, 43349.0, 58393.0, 76033.0, 94725.0, 108627.0, 113394.0, 106863.0, 92919.0, 74427.0, 57251.0, 41381.0, 29552.0, 20165.0, 13495.0, 8965.0, 5800.0, 3747.0, 2443.0, 1518.0, 990.0, 659.0, 391.0, 238.0, 180.0, 92.0, 70.0, 39.0, 24.0, 15.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.40625, -53.64404296875, -51.8818359375, -50.11962890625, -48.357421875, -46.59521484375, -44.8330078125, -43.07080078125, -41.30859375, -39.54638671875, -37.7841796875, -36.02197265625, -34.259765625, -32.49755859375, -30.7353515625, -28.97314453125, -27.2109375, -25.44873046875, -23.6865234375, -21.92431640625, -20.162109375, -18.39990234375, -16.6376953125, -14.87548828125, -13.11328125, -11.35107421875, -9.5888671875, -7.82666015625, -6.064453125, -4.30224609375, -2.5400390625, -0.77783203125, 0.984375, 2.74658203125, 4.5087890625, 6.27099609375, 8.033203125, 9.79541015625, 11.5576171875, 13.31982421875, 15.08203125, 16.84423828125, 18.6064453125, 20.36865234375, 22.130859375, 23.89306640625, 25.6552734375, 27.41748046875, 29.1796875, 30.94189453125, 32.7041015625, 34.46630859375, 36.228515625, 37.99072265625, 39.7529296875, 41.51513671875, 43.27734375, 45.03955078125, 46.8017578125, 48.56396484375, 50.326171875, 52.08837890625, 53.8505859375, 55.61279296875, 57.375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 7.0, 6.0, 13.0, 13.0, 20.0, 16.0, 31.0, 14.0, 24.0, 28.0, 40.0, 34.0, 29.0, 40.0, 47.0, 32.0, 55.0, 43.0, 32.0, 40.0, 31.0, 39.0, 39.0, 38.0, 35.0, 31.0, 20.0, 35.0, 23.0, 18.0, 19.0, 20.0, 15.0, 17.0, 11.0, 6.0, 12.0, 6.0, 7.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.03125, -25.08740234375, -24.1435546875, -23.19970703125, -22.255859375, -21.31201171875, -20.3681640625, -19.42431640625, -18.48046875, -17.53662109375, -16.5927734375, -15.64892578125, -14.705078125, -13.76123046875, -12.8173828125, -11.87353515625, -10.9296875, -9.98583984375, -9.0419921875, -8.09814453125, -7.154296875, -6.21044921875, -5.2666015625, -4.32275390625, -3.37890625, -2.43505859375, -1.4912109375, -0.54736328125, 0.396484375, 1.34033203125, 2.2841796875, 3.22802734375, 4.171875, 5.11572265625, 6.0595703125, 7.00341796875, 7.947265625, 8.89111328125, 9.8349609375, 10.77880859375, 11.72265625, 12.66650390625, 13.6103515625, 14.55419921875, 15.498046875, 16.44189453125, 17.3857421875, 18.32958984375, 19.2734375, 20.21728515625, 21.1611328125, 22.10498046875, 23.048828125, 23.99267578125, 24.9365234375, 25.88037109375, 26.82421875, 27.76806640625, 28.7119140625, 29.65576171875, 30.599609375, 31.54345703125, 32.4873046875, 33.43115234375, 34.375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 11.0, 7.0, 15.0, 22.0, 37.0, 50.0, 79.0, 128.0, 223.0, 292.0, 464.0, 777.0, 1143.0, 1819.0, 2750.0, 4344.0, 6612.0, 10814.0, 16995.0, 26953.0, 42048.0, 64987.0, 97695.0, 137685.0, 164287.0, 148626.0, 110822.0, 74907.0, 48298.0, 31388.0, 19962.0, 12480.0, 7887.0, 4999.0, 3335.0, 1971.0, 1270.0, 844.0, 514.0, 337.0, 235.0, 154.0, 111.0, 61.0, 41.0, 31.0, 19.0, 10.0, 7.0, 7.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-85.8125, -83.013671875, -80.21484375, -77.416015625, -74.6171875, -71.818359375, -69.01953125, -66.220703125, -63.421875, -60.623046875, -57.82421875, -55.025390625, -52.2265625, -49.427734375, -46.62890625, -43.830078125, -41.03125, -38.232421875, -35.43359375, -32.634765625, -29.8359375, -27.037109375, -24.23828125, -21.439453125, -18.640625, -15.841796875, -13.04296875, -10.244140625, -7.4453125, -4.646484375, -1.84765625, 0.951171875, 3.75, 6.548828125, 9.34765625, 12.146484375, 14.9453125, 17.744140625, 20.54296875, 23.341796875, 26.140625, 28.939453125, 31.73828125, 34.537109375, 37.3359375, 40.134765625, 42.93359375, 45.732421875, 48.53125, 51.330078125, 54.12890625, 56.927734375, 59.7265625, 62.525390625, 65.32421875, 68.123046875, 70.921875, 73.720703125, 76.51953125, 79.318359375, 82.1171875, 84.916015625, 87.71484375, 90.513671875, 93.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 4.0, 6.0, 12.0, 9.0, 10.0, 15.0, 23.0, 21.0, 22.0, 31.0, 39.0, 28.0, 27.0, 32.0, 32.0, 43.0, 32.0, 40.0, 36.0, 53.0, 39.0, 34.0, 39.0, 25.0, 45.0, 37.0, 34.0, 37.0, 32.0, 19.0, 33.0, 14.0, 18.0, 14.0, 18.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.90625, -24.120849609375, -23.33544921875, -22.550048828125, -21.7646484375, -20.979248046875, -20.19384765625, -19.408447265625, -18.623046875, -17.837646484375, -17.05224609375, -16.266845703125, -15.4814453125, -14.696044921875, -13.91064453125, -13.125244140625, -12.33984375, -11.554443359375, -10.76904296875, -9.983642578125, -9.1982421875, -8.412841796875, -7.62744140625, -6.842041015625, -6.056640625, -5.271240234375, -4.48583984375, -3.700439453125, -2.9150390625, -2.129638671875, -1.34423828125, -0.558837890625, 0.2265625, 1.011962890625, 1.79736328125, 2.582763671875, 3.3681640625, 4.153564453125, 4.93896484375, 5.724365234375, 6.509765625, 7.295166015625, 8.08056640625, 8.865966796875, 9.6513671875, 10.436767578125, 11.22216796875, 12.007568359375, 12.79296875, 13.578369140625, 14.36376953125, 15.149169921875, 15.9345703125, 16.719970703125, 17.50537109375, 18.290771484375, 19.076171875, 19.861572265625, 20.64697265625, 21.432373046875, 22.2177734375, 23.003173828125, 23.78857421875, 24.573974609375, 25.359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 3.0, 21.0, 19.0, 31.0, 47.0, 72.0, 116.0, 203.0, 257.0, 406.0, 705.0, 1071.0, 1913.0, 3293.0, 5575.0, 10386.0, 20794.0, 42230.0, 92834.0, 200315.0, 296512.0, 195698.0, 90666.0, 41582.0, 19846.0, 10468.0, 5587.0, 3062.0, 1796.0, 1095.0, 682.0, 417.0, 322.0, 165.0, 126.0, 75.0, 47.0, 36.0, 24.0, 15.0, 12.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.5, -40.04296875, -38.5859375, -37.12890625, -35.671875, -34.21484375, -32.7578125, -31.30078125, -29.84375, -28.38671875, -26.9296875, -25.47265625, -24.015625, -22.55859375, -21.1015625, -19.64453125, -18.1875, -16.73046875, -15.2734375, -13.81640625, -12.359375, -10.90234375, -9.4453125, -7.98828125, -6.53125, -5.07421875, -3.6171875, -2.16015625, -0.703125, 0.75390625, 2.2109375, 3.66796875, 5.125, 6.58203125, 8.0390625, 9.49609375, 10.953125, 12.41015625, 13.8671875, 15.32421875, 16.78125, 18.23828125, 19.6953125, 21.15234375, 22.609375, 24.06640625, 25.5234375, 26.98046875, 28.4375, 29.89453125, 31.3515625, 32.80859375, 34.265625, 35.72265625, 37.1796875, 38.63671875, 40.09375, 41.55078125, 43.0078125, 44.46484375, 45.921875, 47.37890625, 48.8359375, 50.29296875, 51.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 0.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 9.0, 8.0, 12.0, 13.0, 15.0, 19.0, 24.0, 35.0, 44.0, 50.0, 62.0, 51.0, 71.0, 74.0, 71.0, 66.0, 56.0, 48.0, 50.0, 32.0, 34.0, 25.0, 16.0, 20.0, 9.0, 13.0, 6.0, 8.0, 11.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003421783447265625, -0.003303706645965576, -0.0031856298446655273, -0.0030675530433654785, -0.0029494762420654297, -0.002831399440765381, -0.002713322639465332, -0.002595245838165283, -0.0024771690368652344, -0.0023590922355651855, -0.0022410154342651367, -0.002122938632965088, -0.002004861831665039, -0.0018867850303649902, -0.0017687082290649414, -0.0016506314277648926, -0.0015325546264648438, -0.001414477825164795, -0.001296401023864746, -0.0011783242225646973, -0.0010602474212646484, -0.0009421706199645996, -0.0008240938186645508, -0.000706017017364502, -0.0005879402160644531, -0.0004698634147644043, -0.00035178661346435547, -0.00023370981216430664, -0.00011563301086425781, 2.4437904357910156e-06, 0.00012052059173583984, 0.00023859739303588867, 0.0003566741943359375, 0.00047475099563598633, 0.0005928277969360352, 0.000710904598236084, 0.0008289813995361328, 0.0009470582008361816, 0.0010651350021362305, 0.0011832118034362793, 0.0013012886047363281, 0.001419365406036377, 0.0015374422073364258, 0.0016555190086364746, 0.0017735958099365234, 0.0018916726112365723, 0.002009749412536621, 0.00212782621383667, 0.0022459030151367188, 0.0023639798164367676, 0.0024820566177368164, 0.0026001334190368652, 0.002718210220336914, 0.002836287021636963, 0.0029543638229370117, 0.0030724406242370605, 0.0031905174255371094, 0.003308594226837158, 0.003426671028137207, 0.003544747829437256, 0.0036628246307373047, 0.0037809014320373535, 0.0038989782333374023, 0.004017055034637451, 0.0041351318359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 14.0, 21.0, 15.0, 29.0, 48.0, 80.0, 123.0, 126.0, 183.0, 256.0, 447.0, 644.0, 953.0, 1603.0, 2326.0, 3756.0, 6031.0, 10112.0, 16767.0, 27515.0, 46265.0, 75687.0, 115679.0, 159103.0, 174306.0, 145375.0, 100308.0, 63155.0, 38271.0, 23132.0, 13623.0, 8346.0, 5139.0, 3155.0, 2095.0, 1297.0, 864.0, 540.0, 362.0, 239.0, 158.0, 135.0, 78.0, 69.0, 30.0, 34.0, 23.0, 12.0, 6.0, 6.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-28.3125, -27.408447265625, -26.50439453125, -25.600341796875, -24.6962890625, -23.792236328125, -22.88818359375, -21.984130859375, -21.080078125, -20.176025390625, -19.27197265625, -18.367919921875, -17.4638671875, -16.559814453125, -15.65576171875, -14.751708984375, -13.84765625, -12.943603515625, -12.03955078125, -11.135498046875, -10.2314453125, -9.327392578125, -8.42333984375, -7.519287109375, -6.615234375, -5.711181640625, -4.80712890625, -3.903076171875, -2.9990234375, -2.094970703125, -1.19091796875, -0.286865234375, 0.6171875, 1.521240234375, 2.42529296875, 3.329345703125, 4.2333984375, 5.137451171875, 6.04150390625, 6.945556640625, 7.849609375, 8.753662109375, 9.65771484375, 10.561767578125, 11.4658203125, 12.369873046875, 13.27392578125, 14.177978515625, 15.08203125, 15.986083984375, 16.89013671875, 17.794189453125, 18.6982421875, 19.602294921875, 20.50634765625, 21.410400390625, 22.314453125, 23.218505859375, 24.12255859375, 25.026611328125, 25.9306640625, 26.834716796875, 27.73876953125, 28.642822265625, 29.546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 8.0, 8.0, 14.0, 17.0, 9.0, 25.0, 24.0, 19.0, 32.0, 25.0, 24.0, 47.0, 47.0, 40.0, 50.0, 54.0, 60.0, 55.0, 50.0, 48.0, 42.0, 35.0, 37.0, 35.0, 23.0, 25.0, 20.0, 25.0, 22.0, 12.0, 5.0, 11.0, 12.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6796875, -9.3359375, -8.9921875, -8.6484375, -8.3046875, -7.9609375, -7.6171875, -7.2734375, -6.9296875, -6.5859375, -6.2421875, -5.8984375, -5.5546875, -5.2109375, -4.8671875, -4.5234375, -4.1796875, -3.8359375, -3.4921875, -3.1484375, -2.8046875, -2.4609375, -2.1171875, -1.7734375, -1.4296875, -1.0859375, -0.7421875, -0.3984375, -0.0546875, 0.2890625, 0.6328125, 0.9765625, 1.3203125, 1.6640625, 2.0078125, 2.3515625, 2.6953125, 3.0390625, 3.3828125, 3.7265625, 4.0703125, 4.4140625, 4.7578125, 5.1015625, 5.4453125, 5.7890625, 6.1328125, 6.4765625, 6.8203125, 7.1640625, 7.5078125, 7.8515625, 8.1953125, 8.5390625, 8.8828125, 9.2265625, 9.5703125, 9.9140625, 10.2578125, 10.6015625, 10.9453125, 11.2890625, 11.6328125, 11.9765625, 12.3203125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 14.0, 9.0, 16.0, 22.0, 27.0, 22.0, 24.0, 28.0, 35.0, 31.0, 45.0, 45.0, 34.0, 51.0, 45.0, 36.0, 54.0, 49.0, 46.0, 40.0, 47.0, 35.0, 41.0, 26.0, 23.0, 20.0, 19.0, 14.0, 22.0, 15.0, 8.0, 8.0, 6.0, 6.0, 9.0, 5.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.449039459228516, -31.454389572143555, -30.459739685058594, -29.465089797973633, -28.470439910888672, -27.475788116455078, -26.481138229370117, -25.486488342285156, -24.491838455200195, -23.497188568115234, -22.502538681030273, -21.507888793945312, -20.51323699951172, -19.51858901977539, -18.523937225341797, -17.529287338256836, -16.534637451171875, -15.539987564086914, -14.545337677001953, -13.550686836242676, -12.556036949157715, -11.561387062072754, -10.566736221313477, -9.572086334228516, -8.577436447143555, -7.582786560058594, -6.588136196136475, -5.5934858322143555, -4.5988359451293945, -3.6041860580444336, -2.6095356941223145, -1.6148853302001953, -0.6202354431152344, 0.37441468238830566, 1.3690648078918457, 2.3637149333953857, 3.358365058898926, 4.353014945983887, 5.347665309906006, 6.342315673828125, 7.336965560913086, 8.331615447998047, 9.326265335083008, 10.320916175842285, 11.315566062927246, 12.310215950012207, 13.304866790771484, 14.299516677856445, 15.294166564941406, 16.288816452026367, 17.283466339111328, 18.27811622619629, 19.27276611328125, 20.267417907714844, 21.262067794799805, 22.256717681884766, 23.251367568969727, 24.246017456054688, 25.24066734313965, 26.23531723022461, 27.229969024658203, 28.22461700439453, 29.219268798828125, 30.213918685913086, 31.208568572998047]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 8.0, 14.0, 10.0, 13.0, 13.0, 28.0, 31.0, 35.0, 29.0, 34.0, 42.0, 31.0, 35.0, 48.0, 41.0, 47.0, 37.0, 46.0, 44.0, 38.0, 64.0, 36.0, 30.0, 27.0, 33.0, 25.0, 26.0, 18.0, 14.0, 21.0, 13.0, 15.0, 14.0, 7.0, 5.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.86933135986328, -29.865570068359375, -28.861806869506836, -27.85804557800293, -26.85428237915039, -25.850521087646484, -24.846759796142578, -23.842998504638672, -22.839235305786133, -21.835474014282227, -20.831710815429688, -19.82794952392578, -18.824188232421875, -17.820425033569336, -16.81666374206543, -15.812901496887207, -14.809139251708984, -13.805377006530762, -12.801614761352539, -11.797853469848633, -10.79409122467041, -9.790328979492188, -8.786567687988281, -7.782805442810059, -6.779043197631836, -5.775280952453613, -4.771519184112549, -3.7677571773529053, -2.7639951705932617, -1.760232925415039, -0.7564711570739746, 0.24729061126708984, 1.2510566711425781, 2.2548186779022217, 3.2585806846618652, 4.26234245300293, 5.266104698181152, 6.269866943359375, 7.2736287117004395, 8.277390480041504, 9.281152725219727, 10.28491497039795, 11.288677215576172, 12.292438507080078, 13.2962007522583, 14.299962997436523, 15.30372428894043, 16.30748748779297, 17.311248779296875, 18.31501007080078, 19.31877326965332, 20.322534561157227, 21.326297760009766, 22.330059051513672, 23.333820343017578, 24.337581634521484, 25.341344833374023, 26.34510612487793, 27.34886932373047, 28.352630615234375, 29.35639190673828, 30.36015510559082, 31.363916397094727, 32.367679595947266, 33.37144088745117]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 13.0, 11.0, 19.0, 29.0, 51.0, 82.0, 139.0, 252.0, 378.0, 594.0, 988.0, 1430.0, 2298.0, 3675.0, 5595.0, 8562.0, 12993.0, 19067.0, 27908.0, 39533.0, 53390.0, 68524.0, 84518.0, 96979.0, 104412.0, 103304.0, 95312.0, 82581.0, 67093.0, 51134.0, 37387.0, 26728.0, 18386.0, 12350.0, 8219.0, 5337.0, 3422.0, 2187.0, 1373.0, 876.0, 560.0, 317.0, 221.0, 150.0, 57.0, 52.0, 23.0, 26.0, 15.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.189208984375, -17.58154296875, -16.973876953125, -16.3662109375, -15.758544921875, -15.15087890625, -14.543212890625, -13.935546875, -13.327880859375, -12.72021484375, -12.112548828125, -11.5048828125, -10.897216796875, -10.28955078125, -9.681884765625, -9.07421875, -8.466552734375, -7.85888671875, -7.251220703125, -6.6435546875, -6.035888671875, -5.42822265625, -4.820556640625, -4.212890625, -3.605224609375, -2.99755859375, -2.389892578125, -1.7822265625, -1.174560546875, -0.56689453125, 0.040771484375, 0.6484375, 1.256103515625, 1.86376953125, 2.471435546875, 3.0791015625, 3.686767578125, 4.29443359375, 4.902099609375, 5.509765625, 6.117431640625, 6.72509765625, 7.332763671875, 7.9404296875, 8.548095703125, 9.15576171875, 9.763427734375, 10.37109375, 10.978759765625, 11.58642578125, 12.194091796875, 12.8017578125, 13.409423828125, 14.01708984375, 14.624755859375, 15.232421875, 15.840087890625, 16.44775390625, 17.055419921875, 17.6630859375, 18.270751953125, 18.87841796875, 19.486083984375, 20.09375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 5.0, 14.0, 5.0, 7.0, 16.0, 14.0, 32.0, 25.0, 26.0, 35.0, 26.0, 30.0, 32.0, 40.0, 28.0, 43.0, 40.0, 47.0, 49.0, 44.0, 35.0, 39.0, 40.0, 28.0, 27.0, 32.0, 31.0, 28.0, 29.0, 25.0, 14.0, 16.0, 18.0, 17.0, 10.0, 11.0, 8.0, 9.0, 3.0, 7.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-33.5625, -32.642822265625, -31.72314453125, -30.803466796875, -29.8837890625, -28.964111328125, -28.04443359375, -27.124755859375, -26.205078125, -25.285400390625, -24.36572265625, -23.446044921875, -22.5263671875, -21.606689453125, -20.68701171875, -19.767333984375, -18.84765625, -17.927978515625, -17.00830078125, -16.088623046875, -15.1689453125, -14.249267578125, -13.32958984375, -12.409912109375, -11.490234375, -10.570556640625, -9.65087890625, -8.731201171875, -7.8115234375, -6.891845703125, -5.97216796875, -5.052490234375, -4.1328125, -3.213134765625, -2.29345703125, -1.373779296875, -0.4541015625, 0.465576171875, 1.38525390625, 2.304931640625, 3.224609375, 4.144287109375, 5.06396484375, 5.983642578125, 6.9033203125, 7.822998046875, 8.74267578125, 9.662353515625, 10.58203125, 11.501708984375, 12.42138671875, 13.341064453125, 14.2607421875, 15.180419921875, 16.10009765625, 17.019775390625, 17.939453125, 18.859130859375, 19.77880859375, 20.698486328125, 21.6181640625, 22.537841796875, 23.45751953125, 24.377197265625, 25.296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 11.0, 12.0, 14.0, 23.0, 48.0, 80.0, 90.0, 176.0, 287.0, 501.0, 861.0, 1479.0, 2534.0, 4447.0, 7921.0, 13654.0, 23380.0, 38900.0, 62012.0, 91532.0, 123579.0, 144055.0, 146011.0, 126048.0, 95189.0, 65286.0, 41283.0, 24831.0, 14522.0, 8346.0, 4764.0, 2830.0, 1579.0, 934.0, 525.0, 339.0, 192.0, 104.0, 65.0, 44.0, 35.0, 13.0, 7.0, 6.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.25, -33.244384765625, -32.23876953125, -31.233154296875, -30.2275390625, -29.221923828125, -28.21630859375, -27.210693359375, -26.205078125, -25.199462890625, -24.19384765625, -23.188232421875, -22.1826171875, -21.177001953125, -20.17138671875, -19.165771484375, -18.16015625, -17.154541015625, -16.14892578125, -15.143310546875, -14.1376953125, -13.132080078125, -12.12646484375, -11.120849609375, -10.115234375, -9.109619140625, -8.10400390625, -7.098388671875, -6.0927734375, -5.087158203125, -4.08154296875, -3.075927734375, -2.0703125, -1.064697265625, -0.05908203125, 0.946533203125, 1.9521484375, 2.957763671875, 3.96337890625, 4.968994140625, 5.974609375, 6.980224609375, 7.98583984375, 8.991455078125, 9.9970703125, 11.002685546875, 12.00830078125, 13.013916015625, 14.01953125, 15.025146484375, 16.03076171875, 17.036376953125, 18.0419921875, 19.047607421875, 20.05322265625, 21.058837890625, 22.064453125, 23.070068359375, 24.07568359375, 25.081298828125, 26.0869140625, 27.092529296875, 28.09814453125, 29.103759765625, 30.109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 7.0, 11.0, 8.0, 20.0, 23.0, 19.0, 35.0, 22.0, 24.0, 36.0, 31.0, 37.0, 45.0, 55.0, 40.0, 41.0, 46.0, 53.0, 60.0, 39.0, 51.0, 53.0, 37.0, 31.0, 32.0, 26.0, 31.0, 24.0, 11.0, 16.0, 9.0, 9.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.390625, -22.652099609375, -21.91357421875, -21.175048828125, -20.4365234375, -19.697998046875, -18.95947265625, -18.220947265625, -17.482421875, -16.743896484375, -16.00537109375, -15.266845703125, -14.5283203125, -13.789794921875, -13.05126953125, -12.312744140625, -11.57421875, -10.835693359375, -10.09716796875, -9.358642578125, -8.6201171875, -7.881591796875, -7.14306640625, -6.404541015625, -5.666015625, -4.927490234375, -4.18896484375, -3.450439453125, -2.7119140625, -1.973388671875, -1.23486328125, -0.496337890625, 0.2421875, 0.980712890625, 1.71923828125, 2.457763671875, 3.1962890625, 3.934814453125, 4.67333984375, 5.411865234375, 6.150390625, 6.888916015625, 7.62744140625, 8.365966796875, 9.1044921875, 9.843017578125, 10.58154296875, 11.320068359375, 12.05859375, 12.797119140625, 13.53564453125, 14.274169921875, 15.0126953125, 15.751220703125, 16.48974609375, 17.228271484375, 17.966796875, 18.705322265625, 19.44384765625, 20.182373046875, 20.9208984375, 21.659423828125, 22.39794921875, 23.136474609375, 23.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 5.0, 10.0, 9.0, 24.0, 33.0, 64.0, 64.0, 95.0, 140.0, 200.0, 289.0, 472.0, 780.0, 1257.0, 2137.0, 3434.0, 6301.0, 11060.0, 20265.0, 37428.0, 67418.0, 110845.0, 159219.0, 183895.0, 163585.0, 117354.0, 71685.0, 40245.0, 21997.0, 11828.0, 6771.0, 3719.0, 2219.0, 1307.0, 841.0, 553.0, 349.0, 195.0, 141.0, 89.0, 76.0, 50.0, 28.0, 18.0, 19.0, 15.0, 10.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.0234375, -12.5972900390625, -12.171142578125, -11.7449951171875, -11.31884765625, -10.8927001953125, -10.466552734375, -10.0404052734375, -9.6142578125, -9.1881103515625, -8.761962890625, -8.3358154296875, -7.90966796875, -7.4835205078125, -7.057373046875, -6.6312255859375, -6.205078125, -5.7789306640625, -5.352783203125, -4.9266357421875, -4.50048828125, -4.0743408203125, -3.648193359375, -3.2220458984375, -2.7958984375, -2.3697509765625, -1.943603515625, -1.5174560546875, -1.09130859375, -0.6651611328125, -0.239013671875, 0.1871337890625, 0.61328125, 1.0394287109375, 1.465576171875, 1.8917236328125, 2.31787109375, 2.7440185546875, 3.170166015625, 3.5963134765625, 4.0224609375, 4.4486083984375, 4.874755859375, 5.3009033203125, 5.72705078125, 6.1531982421875, 6.579345703125, 7.0054931640625, 7.431640625, 7.8577880859375, 8.283935546875, 8.7100830078125, 9.13623046875, 9.5623779296875, 9.988525390625, 10.4146728515625, 10.8408203125, 11.2669677734375, 11.693115234375, 12.1192626953125, 12.54541015625, 12.9715576171875, 13.397705078125, 13.8238525390625, 14.25]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 5.0, 16.0, 17.0, 34.0, 45.0, 40.0, 47.0, 64.0, 76.0, 76.0, 89.0, 97.0, 81.0, 56.0, 59.0, 49.0, 39.0, 27.0, 24.0, 15.0, 12.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022945404052734375, -0.002235323190689087, -0.0021761059761047363, -0.0021168887615203857, -0.002057671546936035, -0.0019984543323516846, -0.001939237117767334, -0.0018800199031829834, -0.0018208026885986328, -0.0017615854740142822, -0.0017023682594299316, -0.001643151044845581, -0.0015839338302612305, -0.0015247166156768799, -0.0014654994010925293, -0.0014062821865081787, -0.0013470649719238281, -0.0012878477573394775, -0.001228630542755127, -0.0011694133281707764, -0.0011101961135864258, -0.0010509788990020752, -0.0009917616844177246, -0.000932544469833374, -0.0008733272552490234, -0.0008141100406646729, -0.0007548928260803223, -0.0006956756114959717, -0.0006364583969116211, -0.0005772411823272705, -0.0005180239677429199, -0.00045880675315856934, -0.00039958953857421875, -0.00034037232398986816, -0.0002811551094055176, -0.000221937894821167, -0.0001627206802368164, -0.00010350346565246582, -4.4286251068115234e-05, 1.4930963516235352e-05, 7.414817810058594e-05, 0.00013336539268493652, 0.0001925826072692871, 0.0002517998218536377, 0.0003110170364379883, 0.00037023425102233887, 0.00042945146560668945, 0.00048866868019104, 0.0005478858947753906, 0.0006071031093597412, 0.0006663203239440918, 0.0007255375385284424, 0.000784754753112793, 0.0008439719676971436, 0.0009031891822814941, 0.0009624063968658447, 0.0010216236114501953, 0.001080840826034546, 0.0011400580406188965, 0.001199275255203247, 0.0012584924697875977, 0.0013177096843719482, 0.0013769268989562988, 0.0014361441135406494, 0.001495361328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 9.0, 6.0, 9.0, 12.0, 22.0, 25.0, 43.0, 54.0, 83.0, 121.0, 205.0, 277.0, 489.0, 825.0, 1342.0, 2457.0, 4381.0, 7627.0, 13770.0, 24327.0, 41871.0, 69422.0, 105987.0, 141734.0, 161545.0, 152891.0, 119377.0, 81015.0, 50568.0, 29659.0, 16586.0, 9407.0, 5178.0, 2904.0, 1651.0, 1022.0, 583.0, 342.0, 242.0, 154.0, 108.0, 61.0, 52.0, 39.0, 31.0, 15.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-11.546875, -11.1934814453125, -10.840087890625, -10.4866943359375, -10.13330078125, -9.7799072265625, -9.426513671875, -9.0731201171875, -8.7197265625, -8.3663330078125, -8.012939453125, -7.6595458984375, -7.30615234375, -6.9527587890625, -6.599365234375, -6.2459716796875, -5.892578125, -5.5391845703125, -5.185791015625, -4.8323974609375, -4.47900390625, -4.1256103515625, -3.772216796875, -3.4188232421875, -3.0654296875, -2.7120361328125, -2.358642578125, -2.0052490234375, -1.65185546875, -1.2984619140625, -0.945068359375, -0.5916748046875, -0.23828125, 0.1151123046875, 0.468505859375, 0.8218994140625, 1.17529296875, 1.5286865234375, 1.882080078125, 2.2354736328125, 2.5888671875, 2.9422607421875, 3.295654296875, 3.6490478515625, 4.00244140625, 4.3558349609375, 4.709228515625, 5.0626220703125, 5.416015625, 5.7694091796875, 6.122802734375, 6.4761962890625, 6.82958984375, 7.1829833984375, 7.536376953125, 7.8897705078125, 8.2431640625, 8.5965576171875, 8.949951171875, 9.3033447265625, 9.65673828125, 10.0101318359375, 10.363525390625, 10.7169189453125, 11.0703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 5.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 8.0, 9.0, 17.0, 8.0, 16.0, 30.0, 27.0, 27.0, 44.0, 27.0, 40.0, 50.0, 54.0, 45.0, 49.0, 57.0, 44.0, 53.0, 46.0, 52.0, 37.0, 34.0, 30.0, 25.0, 28.0, 26.0, 16.0, 14.0, 10.0, 5.0, 6.0, 3.0, 6.0, 7.0, 9.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.673553466796875, -2.56390380859375, -2.454254150390625, -2.3446044921875, -2.234954833984375, -2.12530517578125, -2.015655517578125, -1.906005859375, -1.796356201171875, -1.68670654296875, -1.577056884765625, -1.4674072265625, -1.357757568359375, -1.24810791015625, -1.138458251953125, -1.02880859375, -0.919158935546875, -0.80950927734375, -0.699859619140625, -0.5902099609375, -0.480560302734375, -0.37091064453125, -0.261260986328125, -0.151611328125, -0.041961669921875, 0.06768798828125, 0.177337646484375, 0.2869873046875, 0.396636962890625, 0.50628662109375, 0.615936279296875, 0.7255859375, 0.835235595703125, 0.94488525390625, 1.054534912109375, 1.1641845703125, 1.273834228515625, 1.38348388671875, 1.493133544921875, 1.602783203125, 1.712432861328125, 1.82208251953125, 1.931732177734375, 2.0413818359375, 2.151031494140625, 2.26068115234375, 2.370330810546875, 2.47998046875, 2.589630126953125, 2.69927978515625, 2.808929443359375, 2.9185791015625, 3.028228759765625, 3.13787841796875, 3.247528076171875, 3.357177734375, 3.466827392578125, 3.57647705078125, 3.686126708984375, 3.7957763671875, 3.905426025390625, 4.01507568359375, 4.124725341796875, 4.234375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 8.0, 9.0, 19.0, 21.0, 26.0, 21.0, 28.0, 27.0, 39.0, 39.0, 40.0, 43.0, 54.0, 41.0, 47.0, 46.0, 49.0, 42.0, 31.0, 36.0, 47.0, 31.0, 22.0, 30.0, 31.0, 22.0, 21.0, 22.0, 18.0, 11.0, 5.0, 11.0, 5.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-33.03375244140625, -32.07163619995117, -31.10952377319336, -30.147409439086914, -29.18529510498047, -28.223180770874023, -27.261066436767578, -26.2989501953125, -25.336837768554688, -24.374723434448242, -23.412609100341797, -22.45049476623535, -21.488380432128906, -20.52626609802246, -19.564151763916016, -18.602035522460938, -17.639921188354492, -16.677806854248047, -15.715692520141602, -14.753578186035156, -13.791463851928711, -12.829349517822266, -11.867234230041504, -10.905119895935059, -9.943005561828613, -8.980891227722168, -8.018776893615723, -7.056662082672119, -6.094547748565674, -5.1324334144592285, -4.170318603515625, -3.2082042694091797, -2.2460899353027344, -1.2839754819869995, -0.32186102867126465, 0.6402535438537598, 1.602367877960205, 2.5644822120666504, 3.526597023010254, 4.488711357116699, 5.4508256912231445, 6.41294002532959, 7.375054359436035, 8.337169647216797, 9.299283981323242, 10.261398315429688, 11.223512649536133, 12.185626983642578, 13.147741317749023, 14.109855651855469, 15.071969985961914, 16.03408432006836, 16.996198654174805, 17.95831298828125, 18.920429229736328, 19.88254165649414, 20.84465789794922, 21.806772232055664, 22.76888656616211, 23.731000900268555, 24.693115234375, 25.655229568481445, 26.61734390258789, 27.57946014404297, 28.54157257080078]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 4.0, 4.0, 1.0, 8.0, 3.0, 5.0, 6.0, 10.0, 15.0, 16.0, 9.0, 12.0, 21.0, 15.0, 24.0, 20.0, 21.0, 17.0, 25.0, 31.0, 34.0, 39.0, 47.0, 45.0, 40.0, 37.0, 28.0, 34.0, 37.0, 32.0, 30.0, 28.0, 32.0, 32.0, 27.0, 32.0, 28.0, 23.0, 22.0, 17.0, 15.0, 8.0, 14.0, 17.0, 4.0, 7.0, 5.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.801513671875, -23.95681381225586, -23.112112045288086, -22.267412185668945, -21.422712326049805, -20.57801055908203, -19.73331069946289, -18.88861083984375, -18.043909072875977, -17.199209213256836, -16.354507446289062, -15.509807586669922, -14.665106773376465, -13.820405960083008, -12.975706100463867, -12.13100528717041, -11.28630542755127, -10.441604614257812, -9.596904754638672, -8.752203941345215, -7.907503128051758, -7.062802791595459, -6.21810245513916, -5.373401641845703, -4.528701305389404, -3.6840007305145264, -2.8393001556396484, -1.9945998191833496, -1.1498992443084717, -0.30519866943359375, 0.5395016670227051, 1.384202480316162, 2.228902816772461, 3.073603391647339, 3.918303966522217, 4.763004302978516, 5.607705116271973, 6.4524054527282715, 7.29710578918457, 8.141806602478027, 8.986507415771484, 9.831208229064941, 10.675908088684082, 11.520608901977539, 12.365309715270996, 13.210010528564453, 14.054710388183594, 14.89941120147705, 15.744111061096191, 16.58881187438965, 17.43351173400879, 18.278213500976562, 19.122913360595703, 19.967613220214844, 20.812313079833984, 21.657014846801758, 22.5017147064209, 23.34641456604004, 24.191116333007812, 25.035816192626953, 25.880516052246094, 26.725217819213867, 27.569917678833008, 28.41461944580078, 29.259319305419922]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 7.0, 18.0, 30.0, 45.0, 87.0, 120.0, 202.0, 325.0, 594.0, 1104.0, 2123.0, 4023.0, 7329.0, 13809.0, 26628.0, 52139.0, 100010.0, 190312.0, 345753.0, 559487.0, 740565.0, 756360.0, 589646.0, 370827.0, 205812.0, 108361.0, 56410.0, 28868.0, 15437.0, 8123.0, 4317.0, 2284.0, 1275.0, 810.0, 439.0, 227.0, 138.0, 97.0, 58.0, 31.0, 12.0, 17.0, 11.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.0625, -31.148193359375, -30.23388671875, -29.319580078125, -28.4052734375, -27.490966796875, -26.57666015625, -25.662353515625, -24.748046875, -23.833740234375, -22.91943359375, -22.005126953125, -21.0908203125, -20.176513671875, -19.26220703125, -18.347900390625, -17.43359375, -16.519287109375, -15.60498046875, -14.690673828125, -13.7763671875, -12.862060546875, -11.94775390625, -11.033447265625, -10.119140625, -9.204833984375, -8.29052734375, -7.376220703125, -6.4619140625, -5.547607421875, -4.63330078125, -3.718994140625, -2.8046875, -1.890380859375, -0.97607421875, -0.061767578125, 0.8525390625, 1.766845703125, 2.68115234375, 3.595458984375, 4.509765625, 5.424072265625, 6.33837890625, 7.252685546875, 8.1669921875, 9.081298828125, 9.99560546875, 10.909912109375, 11.82421875, 12.738525390625, 13.65283203125, 14.567138671875, 15.4814453125, 16.395751953125, 17.31005859375, 18.224365234375, 19.138671875, 20.052978515625, 20.96728515625, 21.881591796875, 22.7958984375, 23.710205078125, 24.62451171875, 25.538818359375, 26.453125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 9.0, 8.0, 5.0, 4.0, 13.0, 8.0, 22.0, 9.0, 18.0, 10.0, 19.0, 16.0, 19.0, 34.0, 46.0, 21.0, 34.0, 25.0, 42.0, 31.0, 47.0, 33.0, 32.0, 29.0, 30.0, 37.0, 30.0, 33.0, 37.0, 32.0, 30.0, 20.0, 23.0, 26.0, 16.0, 20.0, 21.0, 18.0, 18.0, 9.0, 9.0, 7.0, 7.0, 7.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-22.796875, -22.106201171875, -21.41552734375, -20.724853515625, -20.0341796875, -19.343505859375, -18.65283203125, -17.962158203125, -17.271484375, -16.580810546875, -15.89013671875, -15.199462890625, -14.5087890625, -13.818115234375, -13.12744140625, -12.436767578125, -11.74609375, -11.055419921875, -10.36474609375, -9.674072265625, -8.9833984375, -8.292724609375, -7.60205078125, -6.911376953125, -6.220703125, -5.530029296875, -4.83935546875, -4.148681640625, -3.4580078125, -2.767333984375, -2.07666015625, -1.385986328125, -0.6953125, -0.004638671875, 0.68603515625, 1.376708984375, 2.0673828125, 2.758056640625, 3.44873046875, 4.139404296875, 4.830078125, 5.520751953125, 6.21142578125, 6.902099609375, 7.5927734375, 8.283447265625, 8.97412109375, 9.664794921875, 10.35546875, 11.046142578125, 11.73681640625, 12.427490234375, 13.1181640625, 13.808837890625, 14.49951171875, 15.190185546875, 15.880859375, 16.571533203125, 17.26220703125, 17.952880859375, 18.6435546875, 19.334228515625, 20.02490234375, 20.715576171875, 21.40625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 8.0, 2.0, 9.0, 17.0, 17.0, 37.0, 40.0, 73.0, 106.0, 197.0, 316.0, 529.0, 994.0, 1729.0, 2889.0, 5316.0, 9505.0, 17268.0, 31521.0, 56822.0, 100768.0, 175142.0, 288372.0, 440116.0, 594245.0, 667275.0, 607229.0, 458223.0, 304731.0, 186368.0, 107804.0, 61001.0, 33591.0, 18732.0, 10375.0, 5579.0, 3150.0, 1732.0, 1018.0, 603.0, 350.0, 211.0, 111.0, 67.0, 31.0, 26.0, 17.0, 11.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.1875, -25.2705078125, -24.353515625, -23.4365234375, -22.51953125, -21.6025390625, -20.685546875, -19.7685546875, -18.8515625, -17.9345703125, -17.017578125, -16.1005859375, -15.18359375, -14.2666015625, -13.349609375, -12.4326171875, -11.515625, -10.5986328125, -9.681640625, -8.7646484375, -7.84765625, -6.9306640625, -6.013671875, -5.0966796875, -4.1796875, -3.2626953125, -2.345703125, -1.4287109375, -0.51171875, 0.4052734375, 1.322265625, 2.2392578125, 3.15625, 4.0732421875, 4.990234375, 5.9072265625, 6.82421875, 7.7412109375, 8.658203125, 9.5751953125, 10.4921875, 11.4091796875, 12.326171875, 13.2431640625, 14.16015625, 15.0771484375, 15.994140625, 16.9111328125, 17.828125, 18.7451171875, 19.662109375, 20.5791015625, 21.49609375, 22.4130859375, 23.330078125, 24.2470703125, 25.1640625, 26.0810546875, 26.998046875, 27.9150390625, 28.83203125, 29.7490234375, 30.666015625, 31.5830078125, 32.5]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 9.0, 5.0, 6.0, 14.0, 8.0, 5.0, 15.0, 24.0, 31.0, 35.0, 41.0, 48.0, 60.0, 65.0, 92.0, 117.0, 121.0, 133.0, 184.0, 194.0, 196.0, 214.0, 230.0, 216.0, 226.0, 211.0, 206.0, 171.0, 179.0, 123.0, 157.0, 139.0, 118.0, 75.0, 80.0, 71.0, 67.0, 43.0, 33.0, 29.0, 26.0, 21.0, 9.0, 9.0, 8.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.1640625, -10.825927734375, -10.48779296875, -10.149658203125, -9.8115234375, -9.473388671875, -9.13525390625, -8.797119140625, -8.458984375, -8.120849609375, -7.78271484375, -7.444580078125, -7.1064453125, -6.768310546875, -6.43017578125, -6.092041015625, -5.75390625, -5.415771484375, -5.07763671875, -4.739501953125, -4.4013671875, -4.063232421875, -3.72509765625, -3.386962890625, -3.048828125, -2.710693359375, -2.37255859375, -2.034423828125, -1.6962890625, -1.358154296875, -1.02001953125, -0.681884765625, -0.34375, -0.005615234375, 0.33251953125, 0.670654296875, 1.0087890625, 1.346923828125, 1.68505859375, 2.023193359375, 2.361328125, 2.699462890625, 3.03759765625, 3.375732421875, 3.7138671875, 4.052001953125, 4.39013671875, 4.728271484375, 5.06640625, 5.404541015625, 5.74267578125, 6.080810546875, 6.4189453125, 6.757080078125, 7.09521484375, 7.433349609375, 7.771484375, 8.109619140625, 8.44775390625, 8.785888671875, 9.1240234375, 9.462158203125, 9.80029296875, 10.138427734375, 10.4765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 7.0, 3.0, 3.0, 8.0, 8.0, 7.0, 10.0, 18.0, 18.0, 16.0, 14.0, 20.0, 19.0, 28.0, 29.0, 29.0, 28.0, 36.0, 38.0, 37.0, 51.0, 31.0, 42.0, 39.0, 38.0, 41.0, 45.0, 31.0, 32.0, 33.0, 29.0, 27.0, 26.0, 27.0, 29.0, 14.0, 13.0, 17.0, 12.0, 4.0, 7.0, 10.0, 8.0, 9.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.756084442138672, -23.90727424621582, -23.0584659576416, -22.20965576171875, -21.36084747314453, -20.51203727722168, -19.663227081298828, -18.81441879272461, -17.965608596801758, -17.116798400878906, -16.267990112304688, -15.419179916381836, -14.5703706741333, -13.721561431884766, -12.872751235961914, -12.023941993713379, -11.175132751464844, -10.326323509216309, -9.477514266967773, -8.628704071044922, -7.779894828796387, -6.931085586547852, -6.082275867462158, -5.233466148376465, -4.38465690612793, -3.5358474254608154, -2.687037944793701, -1.838228464126587, -0.9894189834594727, -0.1406097412109375, 0.7081999778747559, 1.5570096969604492, 2.4058170318603516, 3.254626512527466, 4.10343599319458, 4.952245712280273, 5.801054954528809, 6.649864196777344, 7.498673915863037, 8.34748363494873, 9.196292877197266, 10.0451021194458, 10.893911361694336, 11.742721557617188, 12.591530799865723, 13.440340042114258, 14.28915023803711, 15.137959480285645, 15.98676872253418, 16.83557891845703, 17.68438720703125, 18.5331974029541, 19.382007598876953, 20.230815887451172, 21.079626083374023, 21.928436279296875, 22.777244567871094, 23.626054763793945, 24.474863052368164, 25.323673248291016, 26.172481536865234, 27.021291732788086, 27.870101928710938, 28.718910217285156, 29.567720413208008]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 1.0, 7.0, 8.0, 6.0, 6.0, 15.0, 13.0, 13.0, 20.0, 15.0, 22.0, 20.0, 30.0, 24.0, 24.0, 28.0, 33.0, 24.0, 33.0, 28.0, 47.0, 38.0, 31.0, 41.0, 20.0, 43.0, 27.0, 44.0, 25.0, 29.0, 26.0, 27.0, 16.0, 30.0, 26.0, 19.0, 15.0, 18.0, 19.0, 5.0, 14.0, 6.0, 10.0, 10.0, 4.0, 6.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-24.25715446472168, -23.493690490722656, -22.730226516723633, -21.96676254272461, -21.203298568725586, -20.439834594726562, -19.676368713378906, -18.912906646728516, -18.14944076538086, -17.385976791381836, -16.622512817382812, -15.859048843383789, -15.095584869384766, -14.332120895385742, -13.568655967712402, -12.805191993713379, -12.041728973388672, -11.278264999389648, -10.514801025390625, -9.751337051391602, -8.987873077392578, -8.224409103393555, -7.460944175720215, -6.697480201721191, -5.934016227722168, -5.1705522537231445, -4.407088279724121, -3.6436238288879395, -2.880159854888916, -2.1166958808898926, -1.353231430053711, -0.5897674560546875, 0.17369651794433594, 0.9371606111526489, 1.700624704360962, 2.4640889167785645, 3.227552890777588, 3.9910168647766113, 4.754481315612793, 5.517945289611816, 6.28140926361084, 7.044873237609863, 7.808337211608887, 8.571802139282227, 9.33526611328125, 10.098730087280273, 10.862194061279297, 11.62565803527832, 12.389122009277344, 13.152585983276367, 13.91604995727539, 14.679513931274414, 15.442977905273438, 16.20644187927246, 16.969905853271484, 17.73337173461914, 18.49683380126953, 19.260297775268555, 20.023761749267578, 20.7872257232666, 21.550689697265625, 22.31415367126465, 23.077617645263672, 23.841083526611328, 24.60454750061035]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 14.0, 17.0, 29.0, 43.0, 53.0, 81.0, 123.0, 159.0, 282.0, 393.0, 594.0, 833.0, 1275.0, 1854.0, 2745.0, 3865.0, 5683.0, 8205.0, 11625.0, 17106.0, 25578.0, 38783.0, 60526.0, 93438.0, 135092.0, 161952.0, 150534.0, 111621.0, 73596.0, 46933.0, 30738.0, 20449.0, 13612.0, 9306.0, 6557.0, 4571.0, 3223.0, 2280.0, 1523.0, 1048.0, 728.0, 520.0, 318.0, 232.0, 150.0, 101.0, 67.0, 34.0, 23.0, 16.0, 12.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0], "bins": [-43.375, -42.04931640625, -40.7236328125, -39.39794921875, -38.072265625, -36.74658203125, -35.4208984375, -34.09521484375, -32.76953125, -31.44384765625, -30.1181640625, -28.79248046875, -27.466796875, -26.14111328125, -24.8154296875, -23.48974609375, -22.1640625, -20.83837890625, -19.5126953125, -18.18701171875, -16.861328125, -15.53564453125, -14.2099609375, -12.88427734375, -11.55859375, -10.23291015625, -8.9072265625, -7.58154296875, -6.255859375, -4.93017578125, -3.6044921875, -2.27880859375, -0.953125, 0.37255859375, 1.6982421875, 3.02392578125, 4.349609375, 5.67529296875, 7.0009765625, 8.32666015625, 9.65234375, 10.97802734375, 12.3037109375, 13.62939453125, 14.955078125, 16.28076171875, 17.6064453125, 18.93212890625, 20.2578125, 21.58349609375, 22.9091796875, 24.23486328125, 25.560546875, 26.88623046875, 28.2119140625, 29.53759765625, 30.86328125, 32.18896484375, 33.5146484375, 34.84033203125, 36.166015625, 37.49169921875, 38.8173828125, 40.14306640625, 41.46875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 12.0, 10.0, 6.0, 11.0, 11.0, 20.0, 23.0, 23.0, 27.0, 29.0, 20.0, 46.0, 38.0, 37.0, 39.0, 33.0, 40.0, 35.0, 36.0, 34.0, 33.0, 44.0, 41.0, 31.0, 33.0, 34.0, 35.0, 21.0, 25.0, 22.0, 21.0, 19.0, 10.0, 18.0, 14.0, 10.0, 4.0, 4.0, 6.0, 4.0, 8.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.90625, -23.14208984375, -22.3779296875, -21.61376953125, -20.849609375, -20.08544921875, -19.3212890625, -18.55712890625, -17.79296875, -17.02880859375, -16.2646484375, -15.50048828125, -14.736328125, -13.97216796875, -13.2080078125, -12.44384765625, -11.6796875, -10.91552734375, -10.1513671875, -9.38720703125, -8.623046875, -7.85888671875, -7.0947265625, -6.33056640625, -5.56640625, -4.80224609375, -4.0380859375, -3.27392578125, -2.509765625, -1.74560546875, -0.9814453125, -0.21728515625, 0.546875, 1.31103515625, 2.0751953125, 2.83935546875, 3.603515625, 4.36767578125, 5.1318359375, 5.89599609375, 6.66015625, 7.42431640625, 8.1884765625, 8.95263671875, 9.716796875, 10.48095703125, 11.2451171875, 12.00927734375, 12.7734375, 13.53759765625, 14.3017578125, 15.06591796875, 15.830078125, 16.59423828125, 17.3583984375, 18.12255859375, 18.88671875, 19.65087890625, 20.4150390625, 21.17919921875, 21.943359375, 22.70751953125, 23.4716796875, 24.23583984375, 25.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 11.0, 7.0, 17.0, 31.0, 50.0, 90.0, 109.0, 190.0, 263.0, 476.0, 699.0, 1177.0, 1790.0, 2912.0, 4752.0, 7779.0, 12707.0, 20913.0, 36419.0, 66457.0, 129119.0, 237475.0, 237352.0, 130019.0, 66781.0, 36457.0, 21224.0, 12769.0, 7752.0, 4858.0, 2948.0, 1822.0, 1109.0, 744.0, 481.0, 285.0, 185.0, 113.0, 78.0, 53.0, 27.0, 17.0, 15.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -63.498046875, -61.30859375, -59.119140625, -56.9296875, -54.740234375, -52.55078125, -50.361328125, -48.171875, -45.982421875, -43.79296875, -41.603515625, -39.4140625, -37.224609375, -35.03515625, -32.845703125, -30.65625, -28.466796875, -26.27734375, -24.087890625, -21.8984375, -19.708984375, -17.51953125, -15.330078125, -13.140625, -10.951171875, -8.76171875, -6.572265625, -4.3828125, -2.193359375, -0.00390625, 2.185546875, 4.375, 6.564453125, 8.75390625, 10.943359375, 13.1328125, 15.322265625, 17.51171875, 19.701171875, 21.890625, 24.080078125, 26.26953125, 28.458984375, 30.6484375, 32.837890625, 35.02734375, 37.216796875, 39.40625, 41.595703125, 43.78515625, 45.974609375, 48.1640625, 50.353515625, 52.54296875, 54.732421875, 56.921875, 59.111328125, 61.30078125, 63.490234375, 65.6796875, 67.869140625, 70.05859375, 72.248046875, 74.4375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 14.0, 19.0, 18.0, 14.0, 24.0, 27.0, 35.0, 36.0, 34.0, 43.0, 37.0, 35.0, 40.0, 61.0, 51.0, 38.0, 56.0, 40.0, 54.0, 43.0, 41.0, 30.0, 28.0, 25.0, 31.0, 29.0, 22.0, 13.0, 16.0, 9.0, 7.0, 9.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.46875, -23.748046875, -23.02734375, -22.306640625, -21.5859375, -20.865234375, -20.14453125, -19.423828125, -18.703125, -17.982421875, -17.26171875, -16.541015625, -15.8203125, -15.099609375, -14.37890625, -13.658203125, -12.9375, -12.216796875, -11.49609375, -10.775390625, -10.0546875, -9.333984375, -8.61328125, -7.892578125, -7.171875, -6.451171875, -5.73046875, -5.009765625, -4.2890625, -3.568359375, -2.84765625, -2.126953125, -1.40625, -0.685546875, 0.03515625, 0.755859375, 1.4765625, 2.197265625, 2.91796875, 3.638671875, 4.359375, 5.080078125, 5.80078125, 6.521484375, 7.2421875, 7.962890625, 8.68359375, 9.404296875, 10.125, 10.845703125, 11.56640625, 12.287109375, 13.0078125, 13.728515625, 14.44921875, 15.169921875, 15.890625, 16.611328125, 17.33203125, 18.052734375, 18.7734375, 19.494140625, 20.21484375, 20.935546875, 21.65625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 10.0, 10.0, 10.0, 22.0, 23.0, 38.0, 38.0, 55.0, 65.0, 82.0, 121.0, 179.0, 228.0, 352.0, 524.0, 804.0, 1264.0, 2199.0, 3868.0, 7647.0, 17102.0, 41175.0, 112340.0, 292150.0, 333060.0, 143216.0, 51240.0, 20256.0, 9089.0, 4536.0, 2505.0, 1484.0, 897.0, 607.0, 380.0, 269.0, 212.0, 114.0, 104.0, 77.0, 65.0, 42.0, 30.0, 19.0, 15.0, 12.0, 7.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.0625, -38.77490234375, -37.4873046875, -36.19970703125, -34.912109375, -33.62451171875, -32.3369140625, -31.04931640625, -29.76171875, -28.47412109375, -27.1865234375, -25.89892578125, -24.611328125, -23.32373046875, -22.0361328125, -20.74853515625, -19.4609375, -18.17333984375, -16.8857421875, -15.59814453125, -14.310546875, -13.02294921875, -11.7353515625, -10.44775390625, -9.16015625, -7.87255859375, -6.5849609375, -5.29736328125, -4.009765625, -2.72216796875, -1.4345703125, -0.14697265625, 1.140625, 2.42822265625, 3.7158203125, 5.00341796875, 6.291015625, 7.57861328125, 8.8662109375, 10.15380859375, 11.44140625, 12.72900390625, 14.0166015625, 15.30419921875, 16.591796875, 17.87939453125, 19.1669921875, 20.45458984375, 21.7421875, 23.02978515625, 24.3173828125, 25.60498046875, 26.892578125, 28.18017578125, 29.4677734375, 30.75537109375, 32.04296875, 33.33056640625, 34.6181640625, 35.90576171875, 37.193359375, 38.48095703125, 39.7685546875, 41.05615234375, 42.34375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 14.0, 9.0, 9.0, 23.0, 30.0, 51.0, 80.0, 132.0, 210.0, 165.0, 102.0, 61.0, 39.0, 14.0, 11.0, 12.0, 6.0, 2.0, 2.0, 6.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006015777587890625, -0.005842745304107666, -0.005669713020324707, -0.005496680736541748, -0.005323648452758789, -0.00515061616897583, -0.004977583885192871, -0.004804551601409912, -0.004631519317626953, -0.004458487033843994, -0.004285454750061035, -0.004112422466278076, -0.003939390182495117, -0.003766357898712158, -0.0035933256149291992, -0.0034202933311462402, -0.0032472610473632812, -0.0030742287635803223, -0.0029011964797973633, -0.0027281641960144043, -0.0025551319122314453, -0.0023820996284484863, -0.0022090673446655273, -0.0020360350608825684, -0.0018630027770996094, -0.0016899704933166504, -0.0015169382095336914, -0.0013439059257507324, -0.0011708736419677734, -0.0009978413581848145, -0.0008248090744018555, -0.0006517767906188965, -0.0004787445068359375, -0.0003057122230529785, -0.00013267993927001953, 4.035234451293945e-05, 0.00021338462829589844, 0.0003864169120788574, 0.0005594491958618164, 0.0007324814796447754, 0.0009055137634277344, 0.0010785460472106934, 0.0012515783309936523, 0.0014246106147766113, 0.0015976428985595703, 0.0017706751823425293, 0.0019437074661254883, 0.0021167397499084473, 0.0022897720336914062, 0.0024628043174743652, 0.0026358366012573242, 0.002808868885040283, 0.002981901168823242, 0.003154933452606201, 0.00332796573638916, 0.003500998020172119, 0.003674030303955078, 0.003847062587738037, 0.004020094871520996, 0.004193127155303955, 0.004366159439086914, 0.004539191722869873, 0.004712224006652832, 0.004885256290435791, 0.00505828857421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 9.0, 17.0, 12.0, 18.0, 24.0, 37.0, 48.0, 63.0, 113.0, 133.0, 233.0, 289.0, 489.0, 824.0, 1387.0, 2209.0, 3677.0, 6462.0, 12362.0, 24904.0, 51652.0, 103560.0, 182574.0, 235642.0, 193034.0, 113546.0, 56998.0, 27318.0, 13691.0, 7103.0, 3864.0, 2336.0, 1348.0, 828.0, 561.0, 372.0, 231.0, 170.0, 107.0, 96.0, 64.0, 40.0, 33.0, 25.0, 10.0, 12.0, 5.0, 7.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.84375, -25.965576171875, -25.08740234375, -24.209228515625, -23.3310546875, -22.452880859375, -21.57470703125, -20.696533203125, -19.818359375, -18.940185546875, -18.06201171875, -17.183837890625, -16.3056640625, -15.427490234375, -14.54931640625, -13.671142578125, -12.79296875, -11.914794921875, -11.03662109375, -10.158447265625, -9.2802734375, -8.402099609375, -7.52392578125, -6.645751953125, -5.767578125, -4.889404296875, -4.01123046875, -3.133056640625, -2.2548828125, -1.376708984375, -0.49853515625, 0.379638671875, 1.2578125, 2.135986328125, 3.01416015625, 3.892333984375, 4.7705078125, 5.648681640625, 6.52685546875, 7.405029296875, 8.283203125, 9.161376953125, 10.03955078125, 10.917724609375, 11.7958984375, 12.674072265625, 13.55224609375, 14.430419921875, 15.30859375, 16.186767578125, 17.06494140625, 17.943115234375, 18.8212890625, 19.699462890625, 20.57763671875, 21.455810546875, 22.333984375, 23.212158203125, 24.09033203125, 24.968505859375, 25.8466796875, 26.724853515625, 27.60302734375, 28.481201171875, 29.359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 7.0, 5.0, 17.0, 15.0, 19.0, 13.0, 26.0, 29.0, 46.0, 37.0, 48.0, 57.0, 64.0, 57.0, 58.0, 63.0, 63.0, 65.0, 46.0, 60.0, 32.0, 27.0, 19.0, 27.0, 11.0, 12.0, 13.0, 9.0, 14.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.745361328125, -7.46728515625, -7.189208984375, -6.9111328125, -6.633056640625, -6.35498046875, -6.076904296875, -5.798828125, -5.520751953125, -5.24267578125, -4.964599609375, -4.6865234375, -4.408447265625, -4.13037109375, -3.852294921875, -3.57421875, -3.296142578125, -3.01806640625, -2.739990234375, -2.4619140625, -2.183837890625, -1.90576171875, -1.627685546875, -1.349609375, -1.071533203125, -0.79345703125, -0.515380859375, -0.2373046875, 0.040771484375, 0.31884765625, 0.596923828125, 0.875, 1.153076171875, 1.43115234375, 1.709228515625, 1.9873046875, 2.265380859375, 2.54345703125, 2.821533203125, 3.099609375, 3.377685546875, 3.65576171875, 3.933837890625, 4.2119140625, 4.489990234375, 4.76806640625, 5.046142578125, 5.32421875, 5.602294921875, 5.88037109375, 6.158447265625, 6.4365234375, 6.714599609375, 6.99267578125, 7.270751953125, 7.548828125, 7.826904296875, 8.10498046875, 8.383056640625, 8.6611328125, 8.939208984375, 9.21728515625, 9.495361328125, 9.7734375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 8.0, 4.0, 16.0, 16.0, 19.0, 24.0, 24.0, 28.0, 30.0, 33.0, 36.0, 39.0, 45.0, 50.0, 39.0, 45.0, 44.0, 57.0, 55.0, 49.0, 43.0, 40.0, 46.0, 31.0, 22.0, 18.0, 31.0, 18.0, 16.0, 15.0, 6.0, 14.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.85295867919922, -23.94821548461914, -23.043472290039062, -22.138729095458984, -21.233985900878906, -20.329242706298828, -19.424497604370117, -18.51975440979004, -17.61501121520996, -16.710268020629883, -15.805524826049805, -14.90078067779541, -13.996037483215332, -13.091294288635254, -12.18655014038086, -11.281806945800781, -10.377063751220703, -9.472320556640625, -8.567577362060547, -7.662833213806152, -6.758090019226074, -5.853346824645996, -4.94860315322876, -4.043859481811523, -3.1391162872314453, -2.234372854232788, -1.3296294212341309, -0.42488598823547363, 0.4798574447631836, 1.3846006393432617, 2.289344310760498, 3.1940879821777344, 4.0988311767578125, 5.003574371337891, 5.908318042755127, 6.813061714172363, 7.717804908752441, 8.62254810333252, 9.527292251586914, 10.432035446166992, 11.33677864074707, 12.241521835327148, 13.146265029907227, 14.051009178161621, 14.9557523727417, 15.860495567321777, 16.765239715576172, 17.66998291015625, 18.574726104736328, 19.479469299316406, 20.384212493896484, 21.288955688476562, 22.19369888305664, 23.09844207763672, 24.00318717956543, 24.907930374145508, 25.812673568725586, 26.717416763305664, 27.622159957885742, 28.52690315246582, 29.43164825439453, 30.33639144897461, 31.241134643554688, 32.145877838134766, 33.050621032714844]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 3.0, 2.0, 6.0, 7.0, 6.0, 11.0, 9.0, 12.0, 7.0, 19.0, 20.0, 15.0, 28.0, 20.0, 21.0, 30.0, 29.0, 24.0, 30.0, 36.0, 35.0, 37.0, 34.0, 36.0, 42.0, 31.0, 36.0, 37.0, 32.0, 30.0, 24.0, 28.0, 32.0, 15.0, 35.0, 20.0, 19.0, 22.0, 20.0, 14.0, 13.0, 12.0, 11.0, 11.0, 8.0, 6.0, 7.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.898344039916992, -20.2132511138916, -19.52815818786621, -18.843063354492188, -18.157970428466797, -17.472877502441406, -16.787784576416016, -16.102691650390625, -15.417598724365234, -14.732505798339844, -14.047411918640137, -13.362318992614746, -12.677226066589355, -11.992132186889648, -11.307039260864258, -10.621946334838867, -9.93685245513916, -9.25175952911377, -8.566665649414062, -7.881572723388672, -7.196479797363281, -6.511386394500732, -5.826292991638184, -5.141200065612793, -4.456106662750244, -3.7710134983062744, -3.0859203338623047, -2.400826930999756, -1.7157337665557861, -1.0306406021118164, -0.3455471992492676, 0.33954572677612305, 1.0246391296386719, 1.7097322940826416, 2.3948254585266113, 3.07991886138916, 3.76501202583313, 4.4501051902771, 5.135198593139648, 5.820291519165039, 6.505384922027588, 7.190478324890137, 7.875571250915527, 8.560665130615234, 9.245758056640625, 9.930850982666016, 10.615943908691406, 11.301036834716797, 11.986130714416504, 12.671223640441895, 13.356317520141602, 14.041410446166992, 14.726503372192383, 15.411596298217773, 16.096691131591797, 16.781784057617188, 17.466876983642578, 18.15196990966797, 18.83706283569336, 19.52215576171875, 20.207250595092773, 20.892343521118164, 21.577436447143555, 22.262529373168945, 22.947622299194336]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 10.0, 10.0, 19.0, 20.0, 27.0, 44.0, 68.0, 114.0, 170.0, 276.0, 486.0, 733.0, 1186.0, 1797.0, 2699.0, 4052.0, 6171.0, 9308.0, 14219.0, 20868.0, 30101.0, 42394.0, 57308.0, 74096.0, 90735.0, 103175.0, 108048.0, 104701.0, 93728.0, 77473.0, 60651.0, 45199.0, 31941.0, 22033.0, 15192.0, 9982.0, 6777.0, 4372.0, 2931.0, 1953.0, 1217.0, 810.0, 538.0, 343.0, 208.0, 148.0, 71.0, 71.0, 31.0, 22.0, 14.0, 7.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-18.890625, -18.31103515625, -17.7314453125, -17.15185546875, -16.572265625, -15.99267578125, -15.4130859375, -14.83349609375, -14.25390625, -13.67431640625, -13.0947265625, -12.51513671875, -11.935546875, -11.35595703125, -10.7763671875, -10.19677734375, -9.6171875, -9.03759765625, -8.4580078125, -7.87841796875, -7.298828125, -6.71923828125, -6.1396484375, -5.56005859375, -4.98046875, -4.40087890625, -3.8212890625, -3.24169921875, -2.662109375, -2.08251953125, -1.5029296875, -0.92333984375, -0.34375, 0.23583984375, 0.8154296875, 1.39501953125, 1.974609375, 2.55419921875, 3.1337890625, 3.71337890625, 4.29296875, 4.87255859375, 5.4521484375, 6.03173828125, 6.611328125, 7.19091796875, 7.7705078125, 8.35009765625, 8.9296875, 9.50927734375, 10.0888671875, 10.66845703125, 11.248046875, 11.82763671875, 12.4072265625, 12.98681640625, 13.56640625, 14.14599609375, 14.7255859375, 15.30517578125, 15.884765625, 16.46435546875, 17.0439453125, 17.62353515625, 18.203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 4.0, 10.0, 8.0, 10.0, 18.0, 9.0, 17.0, 18.0, 21.0, 19.0, 12.0, 25.0, 34.0, 27.0, 31.0, 39.0, 35.0, 37.0, 46.0, 33.0, 34.0, 41.0, 43.0, 31.0, 37.0, 26.0, 29.0, 29.0, 30.0, 27.0, 25.0, 25.0, 27.0, 12.0, 18.0, 13.0, 18.0, 12.0, 9.0, 12.0, 5.0, 8.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.03125, -21.316650390625, -20.60205078125, -19.887451171875, -19.1728515625, -18.458251953125, -17.74365234375, -17.029052734375, -16.314453125, -15.599853515625, -14.88525390625, -14.170654296875, -13.4560546875, -12.741455078125, -12.02685546875, -11.312255859375, -10.59765625, -9.883056640625, -9.16845703125, -8.453857421875, -7.7392578125, -7.024658203125, -6.31005859375, -5.595458984375, -4.880859375, -4.166259765625, -3.45166015625, -2.737060546875, -2.0224609375, -1.307861328125, -0.59326171875, 0.121337890625, 0.8359375, 1.550537109375, 2.26513671875, 2.979736328125, 3.6943359375, 4.408935546875, 5.12353515625, 5.838134765625, 6.552734375, 7.267333984375, 7.98193359375, 8.696533203125, 9.4111328125, 10.125732421875, 10.84033203125, 11.554931640625, 12.26953125, 12.984130859375, 13.69873046875, 14.413330078125, 15.1279296875, 15.842529296875, 16.55712890625, 17.271728515625, 17.986328125, 18.700927734375, 19.41552734375, 20.130126953125, 20.8447265625, 21.559326171875, 22.27392578125, 22.988525390625, 23.703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 9.0, 13.0, 24.0, 37.0, 50.0, 88.0, 130.0, 196.0, 284.0, 408.0, 598.0, 985.0, 1490.0, 2278.0, 3346.0, 5005.0, 7648.0, 11157.0, 16809.0, 24074.0, 34290.0, 47410.0, 62793.0, 78861.0, 93102.0, 102523.0, 104871.0, 99923.0, 87258.0, 71955.0, 55763.0, 41519.0, 30099.0, 20841.0, 14211.0, 9478.0, 6501.0, 4251.0, 2819.0, 1873.0, 1195.0, 790.0, 521.0, 366.0, 251.0, 153.0, 114.0, 77.0, 34.0, 25.0, 19.0, 14.0, 10.0, 7.0, 3.0, 2.0, 0.0, 5.0], "bins": [-19.96875, -19.350341796875, -18.73193359375, -18.113525390625, -17.4951171875, -16.876708984375, -16.25830078125, -15.639892578125, -15.021484375, -14.403076171875, -13.78466796875, -13.166259765625, -12.5478515625, -11.929443359375, -11.31103515625, -10.692626953125, -10.07421875, -9.455810546875, -8.83740234375, -8.218994140625, -7.6005859375, -6.982177734375, -6.36376953125, -5.745361328125, -5.126953125, -4.508544921875, -3.89013671875, -3.271728515625, -2.6533203125, -2.034912109375, -1.41650390625, -0.798095703125, -0.1796875, 0.438720703125, 1.05712890625, 1.675537109375, 2.2939453125, 2.912353515625, 3.53076171875, 4.149169921875, 4.767578125, 5.385986328125, 6.00439453125, 6.622802734375, 7.2412109375, 7.859619140625, 8.47802734375, 9.096435546875, 9.71484375, 10.333251953125, 10.95166015625, 11.570068359375, 12.1884765625, 12.806884765625, 13.42529296875, 14.043701171875, 14.662109375, 15.280517578125, 15.89892578125, 16.517333984375, 17.1357421875, 17.754150390625, 18.37255859375, 18.990966796875, 19.609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 11.0, 13.0, 8.0, 15.0, 12.0, 13.0, 20.0, 24.0, 29.0, 27.0, 21.0, 26.0, 31.0, 35.0, 31.0, 36.0, 41.0, 34.0, 31.0, 33.0, 38.0, 29.0, 36.0, 37.0, 42.0, 38.0, 37.0, 26.0, 28.0, 25.0, 21.0, 23.0, 17.0, 10.0, 14.0, 8.0, 9.0, 9.0, 12.0, 7.0, 4.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.796875, -14.319580078125, -13.84228515625, -13.364990234375, -12.8876953125, -12.410400390625, -11.93310546875, -11.455810546875, -10.978515625, -10.501220703125, -10.02392578125, -9.546630859375, -9.0693359375, -8.592041015625, -8.11474609375, -7.637451171875, -7.16015625, -6.682861328125, -6.20556640625, -5.728271484375, -5.2509765625, -4.773681640625, -4.29638671875, -3.819091796875, -3.341796875, -2.864501953125, -2.38720703125, -1.909912109375, -1.4326171875, -0.955322265625, -0.47802734375, -0.000732421875, 0.4765625, 0.953857421875, 1.43115234375, 1.908447265625, 2.3857421875, 2.863037109375, 3.34033203125, 3.817626953125, 4.294921875, 4.772216796875, 5.24951171875, 5.726806640625, 6.2041015625, 6.681396484375, 7.15869140625, 7.635986328125, 8.11328125, 8.590576171875, 9.06787109375, 9.545166015625, 10.0224609375, 10.499755859375, 10.97705078125, 11.454345703125, 11.931640625, 12.408935546875, 12.88623046875, 13.363525390625, 13.8408203125, 14.318115234375, 14.79541015625, 15.272705078125, 15.75]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 14.0, 11.0, 20.0, 27.0, 37.0, 53.0, 74.0, 101.0, 138.0, 200.0, 304.0, 415.0, 567.0, 808.0, 1253.0, 2127.0, 3753.0, 8023.0, 20649.0, 63546.0, 183668.0, 335125.0, 262921.0, 105824.0, 34209.0, 12090.0, 5089.0, 2604.0, 1598.0, 1020.0, 680.0, 474.0, 339.0, 248.0, 131.0, 126.0, 87.0, 61.0, 38.0, 37.0, 22.0, 11.0, 9.0, 11.0, 2.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-27.46875, -26.654296875, -25.83984375, -25.025390625, -24.2109375, -23.396484375, -22.58203125, -21.767578125, -20.953125, -20.138671875, -19.32421875, -18.509765625, -17.6953125, -16.880859375, -16.06640625, -15.251953125, -14.4375, -13.623046875, -12.80859375, -11.994140625, -11.1796875, -10.365234375, -9.55078125, -8.736328125, -7.921875, -7.107421875, -6.29296875, -5.478515625, -4.6640625, -3.849609375, -3.03515625, -2.220703125, -1.40625, -0.591796875, 0.22265625, 1.037109375, 1.8515625, 2.666015625, 3.48046875, 4.294921875, 5.109375, 5.923828125, 6.73828125, 7.552734375, 8.3671875, 9.181640625, 9.99609375, 10.810546875, 11.625, 12.439453125, 13.25390625, 14.068359375, 14.8828125, 15.697265625, 16.51171875, 17.326171875, 18.140625, 18.955078125, 19.76953125, 20.583984375, 21.3984375, 22.212890625, 23.02734375, 23.841796875, 24.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 11.0, 10.0, 12.0, 23.0, 27.0, 48.0, 54.0, 85.0, 91.0, 105.0, 92.0, 77.0, 85.0, 70.0, 44.0, 39.0, 30.0, 16.0, 16.0, 16.0, 4.0, 4.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002071380615234375, -0.0019976794719696045, -0.001923978328704834, -0.0018502771854400635, -0.001776576042175293, -0.0017028748989105225, -0.001629173755645752, -0.0015554726123809814, -0.001481771469116211, -0.0014080703258514404, -0.00133436918258667, -0.0012606680393218994, -0.001186966896057129, -0.0011132657527923584, -0.0010395646095275879, -0.0009658634662628174, -0.0008921623229980469, -0.0008184611797332764, -0.0007447600364685059, -0.0006710588932037354, -0.0005973577499389648, -0.0005236566066741943, -0.00044995546340942383, -0.0003762543201446533, -0.0003025531768798828, -0.0002288520336151123, -0.0001551508903503418, -8.144974708557129e-05, -7.748603820800781e-06, 6.595253944396973e-05, 0.00013965368270874023, 0.00021335482597351074, 0.00028705596923828125, 0.00036075711250305176, 0.00043445825576782227, 0.0005081593990325928, 0.0005818605422973633, 0.0006555616855621338, 0.0007292628288269043, 0.0008029639720916748, 0.0008766651153564453, 0.0009503662586212158, 0.0010240674018859863, 0.0010977685451507568, 0.0011714696884155273, 0.0012451708316802979, 0.0013188719749450684, 0.0013925731182098389, 0.0014662742614746094, 0.0015399754047393799, 0.0016136765480041504, 0.001687377691268921, 0.0017610788345336914, 0.001834779977798462, 0.0019084811210632324, 0.001982182264328003, 0.0020558834075927734, 0.002129584550857544, 0.0022032856941223145, 0.002276986837387085, 0.0023506879806518555, 0.002424389123916626, 0.0024980902671813965, 0.002571791410446167, 0.0026454925537109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 15.0, 16.0, 15.0, 33.0, 54.0, 83.0, 118.0, 187.0, 247.0, 368.0, 590.0, 1036.0, 1908.0, 3963.0, 9315.0, 26392.0, 74511.0, 181526.0, 288908.0, 253144.0, 128151.0, 48123.0, 16941.0, 6287.0, 2861.0, 1417.0, 827.0, 539.0, 300.0, 226.0, 145.0, 102.0, 70.0, 56.0, 22.0, 16.0, 12.0, 8.0, 7.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.859375, -20.203125, -19.546875, -18.890625, -18.234375, -17.578125, -16.921875, -16.265625, -15.609375, -14.953125, -14.296875, -13.640625, -12.984375, -12.328125, -11.671875, -11.015625, -10.359375, -9.703125, -9.046875, -8.390625, -7.734375, -7.078125, -6.421875, -5.765625, -5.109375, -4.453125, -3.796875, -3.140625, -2.484375, -1.828125, -1.171875, -0.515625, 0.140625, 0.796875, 1.453125, 2.109375, 2.765625, 3.421875, 4.078125, 4.734375, 5.390625, 6.046875, 6.703125, 7.359375, 8.015625, 8.671875, 9.328125, 9.984375, 10.640625, 11.296875, 11.953125, 12.609375, 13.265625, 13.921875, 14.578125, 15.234375, 15.890625, 16.546875, 17.203125, 17.859375, 18.515625, 19.171875, 19.828125, 20.484375, 21.140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 17.0, 25.0, 27.0, 35.0, 47.0, 57.0, 71.0, 76.0, 79.0, 94.0, 87.0, 78.0, 60.0, 46.0, 53.0, 34.0, 25.0, 16.0, 13.0, 7.0, 4.0, 5.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.9765625, -5.801025390625, -5.62548828125, -5.449951171875, -5.2744140625, -5.098876953125, -4.92333984375, -4.747802734375, -4.572265625, -4.396728515625, -4.22119140625, -4.045654296875, -3.8701171875, -3.694580078125, -3.51904296875, -3.343505859375, -3.16796875, -2.992431640625, -2.81689453125, -2.641357421875, -2.4658203125, -2.290283203125, -2.11474609375, -1.939208984375, -1.763671875, -1.588134765625, -1.41259765625, -1.237060546875, -1.0615234375, -0.885986328125, -0.71044921875, -0.534912109375, -0.359375, -0.183837890625, -0.00830078125, 0.167236328125, 0.3427734375, 0.518310546875, 0.69384765625, 0.869384765625, 1.044921875, 1.220458984375, 1.39599609375, 1.571533203125, 1.7470703125, 1.922607421875, 2.09814453125, 2.273681640625, 2.44921875, 2.624755859375, 2.80029296875, 2.975830078125, 3.1513671875, 3.326904296875, 3.50244140625, 3.677978515625, 3.853515625, 4.029052734375, 4.20458984375, 4.380126953125, 4.5556640625, 4.731201171875, 4.90673828125, 5.082275390625, 5.2578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 3.0, 14.0, 13.0, 21.0, 14.0, 22.0, 30.0, 30.0, 29.0, 18.0, 43.0, 47.0, 31.0, 36.0, 42.0, 46.0, 45.0, 47.0, 42.0, 40.0, 43.0, 50.0, 47.0, 34.0, 39.0, 10.0, 26.0, 21.0, 13.0, 13.0, 12.0, 12.0, 5.0, 13.0, 5.0, 6.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.16592025756836, -23.354825973510742, -22.543731689453125, -21.732637405395508, -20.92154312133789, -20.11044692993164, -19.299352645874023, -18.488258361816406, -17.67716407775879, -16.866069793701172, -16.054975509643555, -15.243880271911621, -14.432785987854004, -13.621691703796387, -12.810596466064453, -11.999502182006836, -11.188407897949219, -10.377313613891602, -9.566219329833984, -8.75512409210205, -7.944029808044434, -7.132935523986816, -6.321840763092041, -5.510746002197266, -4.699651718139648, -3.888557195663452, -3.077462673187256, -2.2663681507110596, -1.4552736282348633, -0.6441793441772461, 0.1669154167175293, 0.9780101776123047, 1.789102554321289, 2.6001970767974854, 3.4112915992736816, 4.222386360168457, 5.033480644226074, 5.844574928283691, 6.655669689178467, 7.466764450073242, 8.27785873413086, 9.088953018188477, 9.900047302246094, 10.711142539978027, 11.522236824035645, 12.333331108093262, 13.144426345825195, 13.955520629882812, 14.76661491394043, 15.577709197998047, 16.388803482055664, 17.19989776611328, 18.01099395751953, 18.822086334228516, 19.633182525634766, 20.444276809692383, 21.25537109375, 22.066465377807617, 22.877559661865234, 23.68865394592285, 24.49974822998047, 25.31084442138672, 26.121938705444336, 26.933032989501953, 27.74412727355957]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 7.0, 11.0, 11.0, 15.0, 15.0, 18.0, 22.0, 20.0, 17.0, 17.0, 29.0, 37.0, 38.0, 37.0, 37.0, 30.0, 46.0, 37.0, 34.0, 47.0, 45.0, 45.0, 42.0, 36.0, 35.0, 38.0, 27.0, 28.0, 31.0, 16.0, 23.0, 16.0, 16.0, 12.0, 15.0, 14.0, 11.0, 3.0, 8.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.236860275268555, -26.4128360748291, -25.588809967041016, -24.764785766601562, -23.94076156616211, -23.116737365722656, -22.29271125793457, -21.468687057495117, -20.64466094970703, -19.820636749267578, -18.996610641479492, -18.17258644104004, -17.348562240600586, -16.5245361328125, -15.700511932373047, -14.876487731933594, -14.05246353149414, -13.228438377380371, -12.404414176940918, -11.580389022827148, -10.756364822387695, -9.932339668273926, -9.108314514160156, -8.284290313720703, -7.460265159606934, -6.636240482330322, -5.812215805053711, -4.988190650939941, -4.16416597366333, -3.3401412963867188, -2.516116142272949, -1.692091464996338, -0.8680667877197266, -0.044041991233825684, 0.7799828052520752, 1.6040077209472656, 2.428032398223877, 3.2520570755004883, 4.076082229614258, 4.900106906890869, 5.7241315841674805, 6.548156261444092, 7.372180938720703, 8.196206092834473, 9.020231246948242, 9.844255447387695, 10.668280601501465, 11.492305755615234, 12.316329956054688, 13.140355110168457, 13.96437931060791, 14.78840446472168, 15.612428665161133, 16.43645477294922, 17.260478973388672, 18.084503173828125, 18.908527374267578, 19.73255157470703, 20.556577682495117, 21.38060188293457, 22.204626083374023, 23.02865219116211, 23.852676391601562, 24.676700592041016, 25.5007266998291]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 19.0, 29.0, 58.0, 70.0, 121.0, 167.0, 332.0, 574.0, 995.0, 1555.0, 2638.0, 4492.0, 7874.0, 13407.0, 23532.0, 40860.0, 72894.0, 127632.0, 221480.0, 362476.0, 532182.0, 657062.0, 663211.0, 543861.0, 375245.0, 230213.0, 132729.0, 75911.0, 43043.0, 24478.0, 14472.0, 8343.0, 5015.0, 2844.0, 1755.0, 1106.0, 613.0, 364.0, 222.0, 146.0, 98.0, 70.0, 35.0, 23.0, 9.0, 12.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.765625, -19.107666015625, -18.44970703125, -17.791748046875, -17.1337890625, -16.475830078125, -15.81787109375, -15.159912109375, -14.501953125, -13.843994140625, -13.18603515625, -12.528076171875, -11.8701171875, -11.212158203125, -10.55419921875, -9.896240234375, -9.23828125, -8.580322265625, -7.92236328125, -7.264404296875, -6.6064453125, -5.948486328125, -5.29052734375, -4.632568359375, -3.974609375, -3.316650390625, -2.65869140625, -2.000732421875, -1.3427734375, -0.684814453125, -0.02685546875, 0.631103515625, 1.2890625, 1.947021484375, 2.60498046875, 3.262939453125, 3.9208984375, 4.578857421875, 5.23681640625, 5.894775390625, 6.552734375, 7.210693359375, 7.86865234375, 8.526611328125, 9.1845703125, 9.842529296875, 10.50048828125, 11.158447265625, 11.81640625, 12.474365234375, 13.13232421875, 13.790283203125, 14.4482421875, 15.106201171875, 15.76416015625, 16.422119140625, 17.080078125, 17.738037109375, 18.39599609375, 19.053955078125, 19.7119140625, 20.369873046875, 21.02783203125, 21.685791015625, 22.34375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 10.0, 10.0, 12.0, 10.0, 8.0, 13.0, 15.0, 22.0, 24.0, 23.0, 23.0, 37.0, 33.0, 40.0, 24.0, 44.0, 37.0, 34.0, 36.0, 64.0, 44.0, 48.0, 37.0, 40.0, 51.0, 33.0, 28.0, 28.0, 29.0, 24.0, 19.0, 18.0, 15.0, 18.0, 13.0, 7.0, 12.0, 5.0, 5.0, 12.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.421875, -25.6806640625, -24.939453125, -24.1982421875, -23.45703125, -22.7158203125, -21.974609375, -21.2333984375, -20.4921875, -19.7509765625, -19.009765625, -18.2685546875, -17.52734375, -16.7861328125, -16.044921875, -15.3037109375, -14.5625, -13.8212890625, -13.080078125, -12.3388671875, -11.59765625, -10.8564453125, -10.115234375, -9.3740234375, -8.6328125, -7.8916015625, -7.150390625, -6.4091796875, -5.66796875, -4.9267578125, -4.185546875, -3.4443359375, -2.703125, -1.9619140625, -1.220703125, -0.4794921875, 0.26171875, 1.0029296875, 1.744140625, 2.4853515625, 3.2265625, 3.9677734375, 4.708984375, 5.4501953125, 6.19140625, 6.9326171875, 7.673828125, 8.4150390625, 9.15625, 9.8974609375, 10.638671875, 11.3798828125, 12.12109375, 12.8623046875, 13.603515625, 14.3447265625, 15.0859375, 15.8271484375, 16.568359375, 17.3095703125, 18.05078125, 18.7919921875, 19.533203125, 20.2744140625, 21.015625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 6.0, 4.0, 13.0, 19.0, 41.0, 42.0, 115.0, 158.0, 291.0, 512.0, 852.0, 1551.0, 2731.0, 4886.0, 8984.0, 16455.0, 30622.0, 54682.0, 98273.0, 174592.0, 294325.0, 459663.0, 623123.0, 696672.0, 615902.0, 446152.0, 283698.0, 168222.0, 94836.0, 52351.0, 29294.0, 15770.0, 8554.0, 4797.0, 2711.0, 1457.0, 824.0, 456.0, 269.0, 162.0, 94.0, 56.0, 30.0, 12.0, 16.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.296875, -24.492919921875, -23.68896484375, -22.885009765625, -22.0810546875, -21.277099609375, -20.47314453125, -19.669189453125, -18.865234375, -18.061279296875, -17.25732421875, -16.453369140625, -15.6494140625, -14.845458984375, -14.04150390625, -13.237548828125, -12.43359375, -11.629638671875, -10.82568359375, -10.021728515625, -9.2177734375, -8.413818359375, -7.60986328125, -6.805908203125, -6.001953125, -5.197998046875, -4.39404296875, -3.590087890625, -2.7861328125, -1.982177734375, -1.17822265625, -0.374267578125, 0.4296875, 1.233642578125, 2.03759765625, 2.841552734375, 3.6455078125, 4.449462890625, 5.25341796875, 6.057373046875, 6.861328125, 7.665283203125, 8.46923828125, 9.273193359375, 10.0771484375, 10.881103515625, 11.68505859375, 12.489013671875, 13.29296875, 14.096923828125, 14.90087890625, 15.704833984375, 16.5087890625, 17.312744140625, 18.11669921875, 18.920654296875, 19.724609375, 20.528564453125, 21.33251953125, 22.136474609375, 22.9404296875, 23.744384765625, 24.54833984375, 25.352294921875, 26.15625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 2.0, 7.0, 8.0, 7.0, 9.0, 15.0, 21.0, 28.0, 32.0, 45.0, 50.0, 54.0, 67.0, 80.0, 87.0, 107.0, 116.0, 144.0, 161.0, 165.0, 186.0, 179.0, 215.0, 197.0, 214.0, 220.0, 193.0, 196.0, 194.0, 168.0, 129.0, 121.0, 135.0, 101.0, 76.0, 75.0, 46.0, 46.0, 36.0, 31.0, 24.0, 29.0, 10.0, 12.0, 14.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-9.6484375, -9.3719482421875, -9.095458984375, -8.8189697265625, -8.54248046875, -8.2659912109375, -7.989501953125, -7.7130126953125, -7.4365234375, -7.1600341796875, -6.883544921875, -6.6070556640625, -6.33056640625, -6.0540771484375, -5.777587890625, -5.5010986328125, -5.224609375, -4.9481201171875, -4.671630859375, -4.3951416015625, -4.11865234375, -3.8421630859375, -3.565673828125, -3.2891845703125, -3.0126953125, -2.7362060546875, -2.459716796875, -2.1832275390625, -1.90673828125, -1.6302490234375, -1.353759765625, -1.0772705078125, -0.80078125, -0.5242919921875, -0.247802734375, 0.0286865234375, 0.30517578125, 0.5816650390625, 0.858154296875, 1.1346435546875, 1.4111328125, 1.6876220703125, 1.964111328125, 2.2406005859375, 2.51708984375, 2.7935791015625, 3.070068359375, 3.3465576171875, 3.623046875, 3.8995361328125, 4.176025390625, 4.4525146484375, 4.72900390625, 5.0054931640625, 5.281982421875, 5.5584716796875, 5.8349609375, 6.1114501953125, 6.387939453125, 6.6644287109375, 6.94091796875, 7.2174072265625, 7.493896484375, 7.7703857421875, 8.046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 9.0, 12.0, 11.0, 11.0, 25.0, 17.0, 40.0, 26.0, 31.0, 31.0, 32.0, 43.0, 50.0, 35.0, 54.0, 44.0, 44.0, 35.0, 39.0, 46.0, 37.0, 37.0, 44.0, 26.0, 21.0, 29.0, 24.0, 25.0, 14.0, 10.0, 9.0, 11.0, 9.0, 8.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-27.20257568359375, -26.402612686157227, -25.60264778137207, -24.802684783935547, -24.00271987915039, -23.202756881713867, -22.402793884277344, -21.602828979492188, -20.802865982055664, -20.00290298461914, -19.202938079833984, -18.40297508239746, -17.603012084960938, -16.80304718017578, -16.003084182739258, -15.203120231628418, -14.403156280517578, -13.603192329406738, -12.803228378295898, -12.003265380859375, -11.203301429748535, -10.403337478637695, -9.603374481201172, -8.803410530090332, -8.003446578979492, -7.203482627868652, -6.403519153594971, -5.603555679321289, -4.803591728210449, -4.003627777099609, -3.2036643028259277, -2.403700828552246, -1.6037349700927734, -0.8037712574005127, -0.003807544708251953, 0.7961561679840088, 1.5961198806762695, 2.3960835933685303, 3.196047306060791, 3.9960107803344727, 4.7959747314453125, 5.595938682556152, 6.395902156829834, 7.195865631103516, 7.9958295822143555, 8.795793533325195, 9.595756530761719, 10.395720481872559, 11.195684432983398, 11.995648384094238, 12.795612335205078, 13.595575332641602, 14.395539283752441, 15.195503234863281, 15.995466232299805, 16.795429229736328, 17.595394134521484, 18.395357131958008, 19.195322036743164, 19.995285034179688, 20.795249938964844, 21.595212936401367, 22.39517593383789, 23.195140838623047, 23.99510383605957]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 13.0, 15.0, 19.0, 20.0, 13.0, 20.0, 22.0, 27.0, 29.0, 21.0, 37.0, 32.0, 25.0, 45.0, 39.0, 37.0, 42.0, 54.0, 34.0, 49.0, 29.0, 35.0, 50.0, 22.0, 41.0, 29.0, 33.0, 25.0, 20.0, 18.0, 21.0, 13.0, 9.0, 9.0, 6.0, 7.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.329103469848633, -23.54814338684082, -22.76718521118164, -21.986225128173828, -21.205265045166016, -20.424304962158203, -19.64334487915039, -18.86238670349121, -18.0814266204834, -17.300466537475586, -16.519508361816406, -15.738548278808594, -14.957588195800781, -14.176628112792969, -13.395668983459473, -12.614709854125977, -11.833749771118164, -11.052789688110352, -10.271830558776855, -9.49087142944336, -8.709911346435547, -7.928951740264893, -7.147992134094238, -6.367032527923584, -5.58607292175293, -4.805113315582275, -4.024153709411621, -3.243194103240967, -2.4622344970703125, -1.6812748908996582, -0.9003152847290039, -0.11935567855834961, 0.6616039276123047, 1.442563533782959, 2.2235231399536133, 3.0044827461242676, 3.785442352294922, 4.566401958465576, 5.3473615646362305, 6.128321170806885, 6.909280776977539, 7.690240383148193, 8.471199989318848, 9.252159118652344, 10.033119201660156, 10.814079284667969, 11.595038414001465, 12.375997543334961, 13.156957626342773, 13.937917709350586, 14.718876838684082, 15.499835968017578, 16.28079605102539, 17.061756134033203, 17.842716217041016, 18.623674392700195, 19.404634475708008, 20.18559455871582, 20.966552734375, 21.747512817382812, 22.528472900390625, 23.309432983398438, 24.09039306640625, 24.87135124206543, 25.652311325073242]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [7.0, 3.0, 5.0, 4.0, 11.0, 9.0, 19.0, 20.0, 31.0, 42.0, 57.0, 73.0, 108.0, 180.0, 252.0, 356.0, 548.0, 862.0, 1295.0, 1939.0, 3033.0, 4801.0, 7691.0, 12189.0, 20041.0, 34276.0, 61134.0, 109712.0, 182394.0, 216846.0, 164497.0, 95131.0, 53089.0, 30385.0, 17733.0, 10708.0, 6793.0, 4167.0, 2784.0, 1798.0, 1204.0, 791.0, 500.0, 325.0, 236.0, 155.0, 103.0, 69.0, 46.0, 45.0, 17.0, 16.0, 13.0, 13.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-39.9375, -38.578125, -37.21875, -35.859375, -34.5, -33.140625, -31.78125, -30.421875, -29.0625, -27.703125, -26.34375, -24.984375, -23.625, -22.265625, -20.90625, -19.546875, -18.1875, -16.828125, -15.46875, -14.109375, -12.75, -11.390625, -10.03125, -8.671875, -7.3125, -5.953125, -4.59375, -3.234375, -1.875, -0.515625, 0.84375, 2.203125, 3.5625, 4.921875, 6.28125, 7.640625, 9.0, 10.359375, 11.71875, 13.078125, 14.4375, 15.796875, 17.15625, 18.515625, 19.875, 21.234375, 22.59375, 23.953125, 25.3125, 26.671875, 28.03125, 29.390625, 30.75, 32.109375, 33.46875, 34.828125, 36.1875, 37.546875, 38.90625, 40.265625, 41.625, 42.984375, 44.34375, 45.703125, 47.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 10.0, 7.0, 11.0, 4.0, 12.0, 8.0, 10.0, 23.0, 16.0, 20.0, 25.0, 21.0, 41.0, 20.0, 40.0, 35.0, 31.0, 38.0, 51.0, 32.0, 41.0, 47.0, 43.0, 33.0, 29.0, 36.0, 31.0, 31.0, 31.0, 24.0, 25.0, 33.0, 27.0, 10.0, 18.0, 16.0, 12.0, 13.0, 8.0, 7.0, 8.0, 4.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.28125, -22.5517578125, -21.822265625, -21.0927734375, -20.36328125, -19.6337890625, -18.904296875, -18.1748046875, -17.4453125, -16.7158203125, -15.986328125, -15.2568359375, -14.52734375, -13.7978515625, -13.068359375, -12.3388671875, -11.609375, -10.8798828125, -10.150390625, -9.4208984375, -8.69140625, -7.9619140625, -7.232421875, -6.5029296875, -5.7734375, -5.0439453125, -4.314453125, -3.5849609375, -2.85546875, -2.1259765625, -1.396484375, -0.6669921875, 0.0625, 0.7919921875, 1.521484375, 2.2509765625, 2.98046875, 3.7099609375, 4.439453125, 5.1689453125, 5.8984375, 6.6279296875, 7.357421875, 8.0869140625, 8.81640625, 9.5458984375, 10.275390625, 11.0048828125, 11.734375, 12.4638671875, 13.193359375, 13.9228515625, 14.65234375, 15.3818359375, 16.111328125, 16.8408203125, 17.5703125, 18.2998046875, 19.029296875, 19.7587890625, 20.48828125, 21.2177734375, 21.947265625, 22.6767578125, 23.40625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 11.0, 16.0, 10.0, 14.0, 20.0, 27.0, 45.0, 70.0, 94.0, 166.0, 259.0, 366.0, 515.0, 792.0, 1168.0, 1755.0, 2731.0, 4096.0, 6161.0, 9539.0, 14999.0, 23615.0, 39375.0, 69151.0, 126797.0, 209494.0, 215275.0, 136141.0, 73775.0, 41694.0, 25231.0, 15674.0, 10120.0, 6570.0, 4409.0, 2799.0, 1862.0, 1247.0, 762.0, 564.0, 377.0, 257.0, 175.0, 101.0, 84.0, 57.0, 35.0, 23.0, 16.0, 15.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-44.40625, -42.9765625, -41.546875, -40.1171875, -38.6875, -37.2578125, -35.828125, -34.3984375, -32.96875, -31.5390625, -30.109375, -28.6796875, -27.25, -25.8203125, -24.390625, -22.9609375, -21.53125, -20.1015625, -18.671875, -17.2421875, -15.8125, -14.3828125, -12.953125, -11.5234375, -10.09375, -8.6640625, -7.234375, -5.8046875, -4.375, -2.9453125, -1.515625, -0.0859375, 1.34375, 2.7734375, 4.203125, 5.6328125, 7.0625, 8.4921875, 9.921875, 11.3515625, 12.78125, 14.2109375, 15.640625, 17.0703125, 18.5, 19.9296875, 21.359375, 22.7890625, 24.21875, 25.6484375, 27.078125, 28.5078125, 29.9375, 31.3671875, 32.796875, 34.2265625, 35.65625, 37.0859375, 38.515625, 39.9453125, 41.375, 42.8046875, 44.234375, 45.6640625, 47.09375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 8.0, 5.0, 9.0, 4.0, 10.0, 7.0, 10.0, 9.0, 14.0, 17.0, 20.0, 23.0, 32.0, 29.0, 26.0, 36.0, 35.0, 44.0, 41.0, 37.0, 43.0, 45.0, 44.0, 43.0, 32.0, 40.0, 34.0, 40.0, 33.0, 27.0, 32.0, 26.0, 21.0, 17.0, 13.0, 12.0, 16.0, 12.0, 14.0, 10.0, 6.0, 5.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-17.5, -16.9837646484375, -16.467529296875, -15.9512939453125, -15.43505859375, -14.9188232421875, -14.402587890625, -13.8863525390625, -13.3701171875, -12.8538818359375, -12.337646484375, -11.8214111328125, -11.30517578125, -10.7889404296875, -10.272705078125, -9.7564697265625, -9.240234375, -8.7239990234375, -8.207763671875, -7.6915283203125, -7.17529296875, -6.6590576171875, -6.142822265625, -5.6265869140625, -5.1103515625, -4.5941162109375, -4.077880859375, -3.5616455078125, -3.04541015625, -2.5291748046875, -2.012939453125, -1.4967041015625, -0.98046875, -0.4642333984375, 0.052001953125, 0.5682373046875, 1.08447265625, 1.6007080078125, 2.116943359375, 2.6331787109375, 3.1494140625, 3.6656494140625, 4.181884765625, 4.6981201171875, 5.21435546875, 5.7305908203125, 6.246826171875, 6.7630615234375, 7.279296875, 7.7955322265625, 8.311767578125, 8.8280029296875, 9.34423828125, 9.8604736328125, 10.376708984375, 10.8929443359375, 11.4091796875, 11.9254150390625, 12.441650390625, 12.9578857421875, 13.47412109375, 13.9903564453125, 14.506591796875, 15.0228271484375, 15.5390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 3.0, 11.0, 6.0, 9.0, 20.0, 18.0, 25.0, 39.0, 43.0, 57.0, 63.0, 86.0, 120.0, 147.0, 213.0, 299.0, 448.0, 619.0, 880.0, 1270.0, 1864.0, 2960.0, 4725.0, 7527.0, 13001.0, 23131.0, 42606.0, 81659.0, 154316.0, 232670.0, 210323.0, 123709.0, 64563.0, 33501.0, 18558.0, 10656.0, 6440.0, 3914.0, 2571.0, 1620.0, 1127.0, 761.0, 569.0, 387.0, 307.0, 181.0, 117.0, 105.0, 86.0, 52.0, 57.0, 30.0, 20.0, 23.0, 14.0, 9.0, 12.0, 5.0, 6.0, 5.0, 3.0], "bins": [-18.8125, -18.2392578125, -17.666015625, -17.0927734375, -16.51953125, -15.9462890625, -15.373046875, -14.7998046875, -14.2265625, -13.6533203125, -13.080078125, -12.5068359375, -11.93359375, -11.3603515625, -10.787109375, -10.2138671875, -9.640625, -9.0673828125, -8.494140625, -7.9208984375, -7.34765625, -6.7744140625, -6.201171875, -5.6279296875, -5.0546875, -4.4814453125, -3.908203125, -3.3349609375, -2.76171875, -2.1884765625, -1.615234375, -1.0419921875, -0.46875, 0.1044921875, 0.677734375, 1.2509765625, 1.82421875, 2.3974609375, 2.970703125, 3.5439453125, 4.1171875, 4.6904296875, 5.263671875, 5.8369140625, 6.41015625, 6.9833984375, 7.556640625, 8.1298828125, 8.703125, 9.2763671875, 9.849609375, 10.4228515625, 10.99609375, 11.5693359375, 12.142578125, 12.7158203125, 13.2890625, 13.8623046875, 14.435546875, 15.0087890625, 15.58203125, 16.1552734375, 16.728515625, 17.3017578125, 17.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 17.0, 16.0, 28.0, 48.0, 56.0, 130.0, 146.0, 157.0, 129.0, 82.0, 56.0, 27.0, 29.0, 16.0, 9.0, 8.0, 2.0, 8.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002162933349609375, -0.002069026231765747, -0.001975119113922119, -0.0018812119960784912, -0.0017873048782348633, -0.0016933977603912354, -0.0015994906425476074, -0.0015055835247039795, -0.0014116764068603516, -0.0013177692890167236, -0.0012238621711730957, -0.0011299550533294678, -0.0010360479354858398, -0.0009421408176422119, -0.000848233699798584, -0.0007543265819549561, -0.0006604194641113281, -0.0005665123462677002, -0.00047260522842407227, -0.00037869811058044434, -0.0002847909927368164, -0.00019088387489318848, -9.697675704956055e-05, -3.069639205932617e-06, 9.083747863769531e-05, 0.00018474459648132324, 0.00027865171432495117, 0.0003725588321685791, 0.00046646595001220703, 0.000560373067855835, 0.0006542801856994629, 0.0007481873035430908, 0.0008420944213867188, 0.0009360015392303467, 0.0010299086570739746, 0.0011238157749176025, 0.0012177228927612305, 0.0013116300106048584, 0.0014055371284484863, 0.0014994442462921143, 0.0015933513641357422, 0.0016872584819793701, 0.001781165599822998, 0.001875072717666626, 0.001968979835510254, 0.002062886953353882, 0.0021567940711975098, 0.0022507011890411377, 0.0023446083068847656, 0.0024385154247283936, 0.0025324225425720215, 0.0026263296604156494, 0.0027202367782592773, 0.0028141438961029053, 0.002908051013946533, 0.003001958131790161, 0.003095865249633789, 0.003189772367477417, 0.003283679485321045, 0.003377586603164673, 0.0034714937210083008, 0.0035654008388519287, 0.0036593079566955566, 0.0037532150745391846, 0.0038471221923828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 11.0, 10.0, 15.0, 18.0, 23.0, 40.0, 65.0, 69.0, 127.0, 183.0, 250.0, 411.0, 594.0, 1012.0, 1447.0, 2134.0, 3466.0, 5529.0, 8975.0, 14538.0, 23166.0, 37613.0, 58615.0, 86660.0, 118968.0, 144049.0, 146199.0, 125335.0, 94547.0, 64000.0, 41586.0, 26048.0, 15998.0, 9779.0, 6247.0, 3681.0, 2445.0, 1594.0, 1037.0, 697.0, 468.0, 312.0, 173.0, 136.0, 107.0, 61.0, 39.0, 34.0, 19.0, 8.0, 12.0, 7.0, 3.0, 1.0, 4.0, 4.0], "bins": [-13.5703125, -13.1724853515625, -12.774658203125, -12.3768310546875, -11.97900390625, -11.5811767578125, -11.183349609375, -10.7855224609375, -10.3876953125, -9.9898681640625, -9.592041015625, -9.1942138671875, -8.79638671875, -8.3985595703125, -8.000732421875, -7.6029052734375, -7.205078125, -6.8072509765625, -6.409423828125, -6.0115966796875, -5.61376953125, -5.2159423828125, -4.818115234375, -4.4202880859375, -4.0224609375, -3.6246337890625, -3.226806640625, -2.8289794921875, -2.43115234375, -2.0333251953125, -1.635498046875, -1.2376708984375, -0.83984375, -0.4420166015625, -0.044189453125, 0.3536376953125, 0.75146484375, 1.1492919921875, 1.547119140625, 1.9449462890625, 2.3427734375, 2.7406005859375, 3.138427734375, 3.5362548828125, 3.93408203125, 4.3319091796875, 4.729736328125, 5.1275634765625, 5.525390625, 5.9232177734375, 6.321044921875, 6.7188720703125, 7.11669921875, 7.5145263671875, 7.912353515625, 8.3101806640625, 8.7080078125, 9.1058349609375, 9.503662109375, 9.9014892578125, 10.29931640625, 10.6971435546875, 11.094970703125, 11.4927978515625, 11.890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 5.0, 5.0, 5.0, 5.0, 8.0, 9.0, 10.0, 15.0, 19.0, 16.0, 23.0, 24.0, 29.0, 41.0, 40.0, 55.0, 65.0, 45.0, 56.0, 52.0, 58.0, 57.0, 53.0, 41.0, 45.0, 35.0, 37.0, 39.0, 27.0, 21.0, 13.0, 15.0, 8.0, 5.0, 8.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6328125, -5.44964599609375, -5.2664794921875, -5.08331298828125, -4.900146484375, -4.71697998046875, -4.5338134765625, -4.35064697265625, -4.16748046875, -3.98431396484375, -3.8011474609375, -3.61798095703125, -3.434814453125, -3.25164794921875, -3.0684814453125, -2.88531494140625, -2.7021484375, -2.51898193359375, -2.3358154296875, -2.15264892578125, -1.969482421875, -1.78631591796875, -1.6031494140625, -1.41998291015625, -1.23681640625, -1.05364990234375, -0.8704833984375, -0.68731689453125, -0.504150390625, -0.32098388671875, -0.1378173828125, 0.04534912109375, 0.228515625, 0.41168212890625, 0.5948486328125, 0.77801513671875, 0.961181640625, 1.14434814453125, 1.3275146484375, 1.51068115234375, 1.69384765625, 1.87701416015625, 2.0601806640625, 2.24334716796875, 2.426513671875, 2.60968017578125, 2.7928466796875, 2.97601318359375, 3.1591796875, 3.34234619140625, 3.5255126953125, 3.70867919921875, 3.891845703125, 4.07501220703125, 4.2581787109375, 4.44134521484375, 4.62451171875, 4.80767822265625, 4.9908447265625, 5.17401123046875, 5.357177734375, 5.54034423828125, 5.7235107421875, 5.90667724609375, 6.08984375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 10.0, 10.0, 7.0, 16.0, 12.0, 17.0, 18.0, 22.0, 21.0, 32.0, 19.0, 36.0, 43.0, 37.0, 38.0, 36.0, 32.0, 53.0, 43.0, 41.0, 42.0, 41.0, 41.0, 33.0, 45.0, 33.0, 28.0, 25.0, 35.0, 22.0, 19.0, 19.0, 7.0, 14.0, 8.0, 7.0, 8.0, 2.0, 3.0, 6.0, 2.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.85923194885254, -22.121984481811523, -21.384735107421875, -20.64748764038086, -19.91023826599121, -19.172990798950195, -18.435741424560547, -17.69849395751953, -16.961244583129883, -16.223997116088867, -15.486747741699219, -14.749499320983887, -14.012250900268555, -13.275002479553223, -12.53775405883789, -11.800506591796875, -11.063258171081543, -10.326009750366211, -9.588761329650879, -8.851512908935547, -8.114264488220215, -7.377016067504883, -6.639768123626709, -5.902519702911377, -5.165271282196045, -4.428022861480713, -3.690774440765381, -2.953526258468628, -2.216277837753296, -1.4790294170379639, -0.7417812347412109, -0.004532814025878906, 0.7327156066894531, 1.4699640274047852, 2.207212448120117, 2.94446063041687, 3.681709051132202, 4.418957710266113, 5.156205654144287, 5.893454074859619, 6.630702495574951, 7.367950916290283, 8.105198860168457, 8.842447280883789, 9.579695701599121, 10.316944122314453, 11.054192543029785, 11.791440963745117, 12.52868938446045, 13.265937805175781, 14.003186225891113, 14.740434646606445, 15.477683067321777, 16.21493148803711, 16.952178955078125, 17.689428329467773, 18.42667579650879, 19.163923263549805, 19.901172637939453, 20.63842010498047, 21.375669479370117, 22.112916946411133, 22.85016632080078, 23.587413787841797, 24.324663162231445]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 7.0, 12.0, 13.0, 16.0, 17.0, 19.0, 20.0, 24.0, 30.0, 21.0, 28.0, 37.0, 36.0, 29.0, 34.0, 43.0, 41.0, 49.0, 39.0, 46.0, 40.0, 35.0, 37.0, 40.0, 41.0, 26.0, 42.0, 24.0, 28.0, 20.0, 22.0, 16.0, 18.0, 5.0, 6.0, 8.0, 5.0, 6.0, 7.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.105548858642578, -22.346323013305664, -21.587095260620117, -20.827869415283203, -20.06864356994629, -19.309417724609375, -18.550189971923828, -17.790964126586914, -17.03173828125, -16.272512435913086, -15.513285636901855, -14.754058837890625, -13.994832992553711, -13.23560619354248, -12.47637939453125, -11.717153549194336, -10.957925796508789, -10.198698997497559, -9.439473152160645, -8.680246353149414, -7.921020030975342, -7.1617937088012695, -6.402566909790039, -5.643340587615967, -4.8841142654418945, -4.124887943267822, -3.365661382675171, -2.6064348220825195, -1.8472084999084473, -1.087982177734375, -0.32875537872314453, 0.43047094345092773, 1.1896953582763672, 1.948921799659729, 2.708148241043091, 3.467374801635742, 4.2266011238098145, 4.985827445983887, 5.745054244995117, 6.5042805671691895, 7.263506889343262, 8.022733688354492, 8.781959533691406, 9.541186332702637, 10.300413131713867, 11.059638977050781, 11.818865776062012, 12.578092575073242, 13.337318420410156, 14.096545219421387, 14.8557710647583, 15.614997863769531, 16.374223709106445, 17.13344955444336, 17.892677307128906, 18.65190315246582, 19.411128997802734, 20.17035484313965, 20.929582595825195, 21.68880844116211, 22.448034286499023, 23.207260131835938, 23.966487884521484, 24.7257137298584, 25.484941482543945]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 7.0, 12.0, 13.0, 28.0, 26.0, 56.0, 81.0, 113.0, 189.0, 313.0, 459.0, 718.0, 1211.0, 1812.0, 2888.0, 4438.0, 6930.0, 10713.0, 16073.0, 23439.0, 33893.0, 46363.0, 62971.0, 79695.0, 95225.0, 105823.0, 107891.0, 101915.0, 88455.0, 72586.0, 55877.0, 40915.0, 29145.0, 19957.0, 13401.0, 8728.0, 5836.0, 3780.0, 2365.0, 1515.0, 997.0, 611.0, 360.0, 261.0, 177.0, 106.0, 68.0, 48.0, 31.0, 15.0, 16.0, 12.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.296875, -15.7587890625, -15.220703125, -14.6826171875, -14.14453125, -13.6064453125, -13.068359375, -12.5302734375, -11.9921875, -11.4541015625, -10.916015625, -10.3779296875, -9.83984375, -9.3017578125, -8.763671875, -8.2255859375, -7.6875, -7.1494140625, -6.611328125, -6.0732421875, -5.53515625, -4.9970703125, -4.458984375, -3.9208984375, -3.3828125, -2.8447265625, -2.306640625, -1.7685546875, -1.23046875, -0.6923828125, -0.154296875, 0.3837890625, 0.921875, 1.4599609375, 1.998046875, 2.5361328125, 3.07421875, 3.6123046875, 4.150390625, 4.6884765625, 5.2265625, 5.7646484375, 6.302734375, 6.8408203125, 7.37890625, 7.9169921875, 8.455078125, 8.9931640625, 9.53125, 10.0693359375, 10.607421875, 11.1455078125, 11.68359375, 12.2216796875, 12.759765625, 13.2978515625, 13.8359375, 14.3740234375, 14.912109375, 15.4501953125, 15.98828125, 16.5263671875, 17.064453125, 17.6025390625, 18.140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 7.0, 3.0, 6.0, 9.0, 9.0, 10.0, 19.0, 19.0, 7.0, 16.0, 25.0, 26.0, 15.0, 31.0, 23.0, 40.0, 39.0, 44.0, 32.0, 30.0, 33.0, 44.0, 33.0, 50.0, 36.0, 22.0, 24.0, 44.0, 48.0, 39.0, 20.0, 28.0, 26.0, 19.0, 18.0, 21.0, 13.0, 11.0, 15.0, 8.0, 8.0, 10.0, 5.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.46875, -20.787109375, -20.10546875, -19.423828125, -18.7421875, -18.060546875, -17.37890625, -16.697265625, -16.015625, -15.333984375, -14.65234375, -13.970703125, -13.2890625, -12.607421875, -11.92578125, -11.244140625, -10.5625, -9.880859375, -9.19921875, -8.517578125, -7.8359375, -7.154296875, -6.47265625, -5.791015625, -5.109375, -4.427734375, -3.74609375, -3.064453125, -2.3828125, -1.701171875, -1.01953125, -0.337890625, 0.34375, 1.025390625, 1.70703125, 2.388671875, 3.0703125, 3.751953125, 4.43359375, 5.115234375, 5.796875, 6.478515625, 7.16015625, 7.841796875, 8.5234375, 9.205078125, 9.88671875, 10.568359375, 11.25, 11.931640625, 12.61328125, 13.294921875, 13.9765625, 14.658203125, 15.33984375, 16.021484375, 16.703125, 17.384765625, 18.06640625, 18.748046875, 19.4296875, 20.111328125, 20.79296875, 21.474609375, 22.15625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 13.0, 24.0, 38.0, 48.0, 70.0, 156.0, 218.0, 351.0, 605.0, 978.0, 1602.0, 2802.0, 4385.0, 7274.0, 12096.0, 19114.0, 29899.0, 45505.0, 65159.0, 87656.0, 109626.0, 123952.0, 124609.0, 113518.0, 92765.0, 69921.0, 48775.0, 32535.0, 21064.0, 13036.0, 8139.0, 5017.0, 2969.0, 1807.0, 1119.0, 650.0, 409.0, 265.0, 158.0, 85.0, 57.0, 26.0, 16.0, 14.0, 13.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.265625, -21.572021484375, -20.87841796875, -20.184814453125, -19.4912109375, -18.797607421875, -18.10400390625, -17.410400390625, -16.716796875, -16.023193359375, -15.32958984375, -14.635986328125, -13.9423828125, -13.248779296875, -12.55517578125, -11.861572265625, -11.16796875, -10.474365234375, -9.78076171875, -9.087158203125, -8.3935546875, -7.699951171875, -7.00634765625, -6.312744140625, -5.619140625, -4.925537109375, -4.23193359375, -3.538330078125, -2.8447265625, -2.151123046875, -1.45751953125, -0.763916015625, -0.0703125, 0.623291015625, 1.31689453125, 2.010498046875, 2.7041015625, 3.397705078125, 4.09130859375, 4.784912109375, 5.478515625, 6.172119140625, 6.86572265625, 7.559326171875, 8.2529296875, 8.946533203125, 9.64013671875, 10.333740234375, 11.02734375, 11.720947265625, 12.41455078125, 13.108154296875, 13.8017578125, 14.495361328125, 15.18896484375, 15.882568359375, 16.576171875, 17.269775390625, 17.96337890625, 18.656982421875, 19.3505859375, 20.044189453125, 20.73779296875, 21.431396484375, 22.125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 5.0, 6.0, 7.0, 5.0, 14.0, 9.0, 9.0, 17.0, 20.0, 22.0, 24.0, 15.0, 23.0, 30.0, 28.0, 30.0, 32.0, 37.0, 39.0, 40.0, 40.0, 34.0, 34.0, 47.0, 39.0, 39.0, 39.0, 47.0, 29.0, 34.0, 23.0, 34.0, 23.0, 17.0, 13.0, 11.0, 10.0, 12.0, 12.0, 11.0, 14.0, 2.0, 3.0, 4.0, 1.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.5703125, -13.1170654296875, -12.663818359375, -12.2105712890625, -11.75732421875, -11.3040771484375, -10.850830078125, -10.3975830078125, -9.9443359375, -9.4910888671875, -9.037841796875, -8.5845947265625, -8.13134765625, -7.6781005859375, -7.224853515625, -6.7716064453125, -6.318359375, -5.8651123046875, -5.411865234375, -4.9586181640625, -4.50537109375, -4.0521240234375, -3.598876953125, -3.1456298828125, -2.6923828125, -2.2391357421875, -1.785888671875, -1.3326416015625, -0.87939453125, -0.4261474609375, 0.027099609375, 0.4803466796875, 0.93359375, 1.3868408203125, 1.840087890625, 2.2933349609375, 2.74658203125, 3.1998291015625, 3.653076171875, 4.1063232421875, 4.5595703125, 5.0128173828125, 5.466064453125, 5.9193115234375, 6.37255859375, 6.8258056640625, 7.279052734375, 7.7322998046875, 8.185546875, 8.6387939453125, 9.092041015625, 9.5452880859375, 9.99853515625, 10.4517822265625, 10.905029296875, 11.3582763671875, 11.8115234375, 12.2647705078125, 12.718017578125, 13.1712646484375, 13.62451171875, 14.0777587890625, 14.531005859375, 14.9842529296875, 15.4375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 14.0, 14.0, 41.0, 48.0, 47.0, 103.0, 161.0, 217.0, 362.0, 547.0, 896.0, 1416.0, 2377.0, 3864.0, 6530.0, 10873.0, 18535.0, 31636.0, 52702.0, 84133.0, 121639.0, 154434.0, 161013.0, 137766.0, 99337.0, 63874.0, 38970.0, 23269.0, 13335.0, 8096.0, 4770.0, 2815.0, 1761.0, 1056.0, 714.0, 420.0, 256.0, 179.0, 115.0, 74.0, 51.0, 40.0, 27.0, 12.0, 4.0, 4.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.75, -11.3961181640625, -11.042236328125, -10.6883544921875, -10.33447265625, -9.9805908203125, -9.626708984375, -9.2728271484375, -8.9189453125, -8.5650634765625, -8.211181640625, -7.8572998046875, -7.50341796875, -7.1495361328125, -6.795654296875, -6.4417724609375, -6.087890625, -5.7340087890625, -5.380126953125, -5.0262451171875, -4.67236328125, -4.3184814453125, -3.964599609375, -3.6107177734375, -3.2568359375, -2.9029541015625, -2.549072265625, -2.1951904296875, -1.84130859375, -1.4874267578125, -1.133544921875, -0.7796630859375, -0.42578125, -0.0718994140625, 0.281982421875, 0.6358642578125, 0.98974609375, 1.3436279296875, 1.697509765625, 2.0513916015625, 2.4052734375, 2.7591552734375, 3.113037109375, 3.4669189453125, 3.82080078125, 4.1746826171875, 4.528564453125, 4.8824462890625, 5.236328125, 5.5902099609375, 5.944091796875, 6.2979736328125, 6.65185546875, 7.0057373046875, 7.359619140625, 7.7135009765625, 8.0673828125, 8.4212646484375, 8.775146484375, 9.1290283203125, 9.48291015625, 9.8367919921875, 10.190673828125, 10.5445556640625, 10.8984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 9.0, 14.0, 14.0, 19.0, 23.0, 33.0, 30.0, 39.0, 55.0, 48.0, 37.0, 45.0, 58.0, 58.0, 59.0, 54.0, 56.0, 43.0, 44.0, 38.0, 38.0, 29.0, 25.0, 26.0, 22.0, 14.0, 15.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0013380050659179688, -0.0012992173433303833, -0.0012604296207427979, -0.0012216418981552124, -0.001182854175567627, -0.0011440664529800415, -0.001105278730392456, -0.0010664910078048706, -0.0010277032852172852, -0.0009889155626296997, -0.0009501278400421143, -0.0009113401174545288, -0.0008725523948669434, -0.0008337646722793579, -0.0007949769496917725, -0.000756189227104187, -0.0007174015045166016, -0.0006786137819290161, -0.0006398260593414307, -0.0006010383367538452, -0.0005622506141662598, -0.0005234628915786743, -0.00048467516899108887, -0.0004458874464035034, -0.00040709972381591797, -0.0003683120012283325, -0.00032952427864074707, -0.0002907365560531616, -0.00025194883346557617, -0.00021316111087799072, -0.00017437338829040527, -0.00013558566570281982, -9.679794311523438e-05, -5.8010220527648926e-05, -1.9222497940063477e-05, 1.9565224647521973e-05, 5.835294723510742e-05, 9.714066982269287e-05, 0.00013592839241027832, 0.00017471611499786377, 0.00021350383758544922, 0.00025229156017303467, 0.0002910792827606201, 0.00032986700534820557, 0.000368654727935791, 0.00040744245052337646, 0.0004462301731109619, 0.00048501789569854736, 0.0005238056182861328, 0.0005625933408737183, 0.0006013810634613037, 0.0006401687860488892, 0.0006789565086364746, 0.0007177442312240601, 0.0007565319538116455, 0.000795319676399231, 0.0008341073989868164, 0.0008728951215744019, 0.0009116828441619873, 0.0009504705667495728, 0.0009892582893371582, 0.0010280460119247437, 0.001066833734512329, 0.0011056214570999146, 0.0011444091796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 11.0, 26.0, 29.0, 33.0, 42.0, 86.0, 139.0, 204.0, 317.0, 482.0, 853.0, 1323.0, 2366.0, 3808.0, 6448.0, 10776.0, 17910.0, 29129.0, 46797.0, 70743.0, 98910.0, 126711.0, 141479.0, 136309.0, 114335.0, 85071.0, 58143.0, 37791.0, 23077.0, 14068.0, 8374.0, 5172.0, 2973.0, 1790.0, 1067.0, 665.0, 392.0, 233.0, 163.0, 107.0, 54.0, 38.0, 28.0, 28.0, 19.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.265625, -8.973876953125, -8.68212890625, -8.390380859375, -8.0986328125, -7.806884765625, -7.51513671875, -7.223388671875, -6.931640625, -6.639892578125, -6.34814453125, -6.056396484375, -5.7646484375, -5.472900390625, -5.18115234375, -4.889404296875, -4.59765625, -4.305908203125, -4.01416015625, -3.722412109375, -3.4306640625, -3.138916015625, -2.84716796875, -2.555419921875, -2.263671875, -1.971923828125, -1.68017578125, -1.388427734375, -1.0966796875, -0.804931640625, -0.51318359375, -0.221435546875, 0.0703125, 0.362060546875, 0.65380859375, 0.945556640625, 1.2373046875, 1.529052734375, 1.82080078125, 2.112548828125, 2.404296875, 2.696044921875, 2.98779296875, 3.279541015625, 3.5712890625, 3.863037109375, 4.15478515625, 4.446533203125, 4.73828125, 5.030029296875, 5.32177734375, 5.613525390625, 5.9052734375, 6.197021484375, 6.48876953125, 6.780517578125, 7.072265625, 7.364013671875, 7.65576171875, 7.947509765625, 8.2392578125, 8.531005859375, 8.82275390625, 9.114501953125, 9.40625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 9.0, 10.0, 10.0, 8.0, 8.0, 24.0, 12.0, 23.0, 18.0, 27.0, 32.0, 37.0, 35.0, 38.0, 35.0, 56.0, 48.0, 54.0, 52.0, 45.0, 58.0, 46.0, 41.0, 41.0, 26.0, 38.0, 26.0, 31.0, 18.0, 18.0, 9.0, 12.0, 14.0, 12.0, 7.0, 3.0, 11.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.078125, -3.960205078125, -3.84228515625, -3.724365234375, -3.6064453125, -3.488525390625, -3.37060546875, -3.252685546875, -3.134765625, -3.016845703125, -2.89892578125, -2.781005859375, -2.6630859375, -2.545166015625, -2.42724609375, -2.309326171875, -2.19140625, -2.073486328125, -1.95556640625, -1.837646484375, -1.7197265625, -1.601806640625, -1.48388671875, -1.365966796875, -1.248046875, -1.130126953125, -1.01220703125, -0.894287109375, -0.7763671875, -0.658447265625, -0.54052734375, -0.422607421875, -0.3046875, -0.186767578125, -0.06884765625, 0.049072265625, 0.1669921875, 0.284912109375, 0.40283203125, 0.520751953125, 0.638671875, 0.756591796875, 0.87451171875, 0.992431640625, 1.1103515625, 1.228271484375, 1.34619140625, 1.464111328125, 1.58203125, 1.699951171875, 1.81787109375, 1.935791015625, 2.0537109375, 2.171630859375, 2.28955078125, 2.407470703125, 2.525390625, 2.643310546875, 2.76123046875, 2.879150390625, 2.9970703125, 3.114990234375, 3.23291015625, 3.350830078125, 3.46875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 11.0, 5.0, 13.0, 17.0, 17.0, 17.0, 20.0, 28.0, 20.0, 31.0, 25.0, 43.0, 41.0, 35.0, 53.0, 47.0, 48.0, 44.0, 40.0, 50.0, 46.0, 39.0, 32.0, 42.0, 27.0, 37.0, 35.0, 27.0, 18.0, 16.0, 15.0, 7.0, 14.0, 13.0, 5.0, 5.0, 0.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.80634307861328, -21.02112579345703, -20.23590850830078, -19.45069122314453, -18.66547393798828, -17.880258560180664, -17.095041275024414, -16.309823989868164, -15.524606704711914, -14.739389419555664, -13.954172134399414, -13.16895580291748, -12.38373851776123, -11.59852123260498, -10.813304901123047, -10.028087615966797, -9.242870330810547, -8.457653045654297, -7.672436237335205, -6.887219429016113, -6.102002143859863, -5.316784858703613, -4.5315680503845215, -3.7463512420654297, -2.9611339569091797, -2.175916910171509, -1.390699863433838, -0.605482816696167, 0.1797342300415039, 0.9649512767791748, 1.7501683235168457, 2.5353851318359375, 3.3206043243408203, 4.10582160949707, 4.891038417816162, 5.676255226135254, 6.461472511291504, 7.246689796447754, 8.031906127929688, 8.817123413085938, 9.602340698242188, 10.387557983398438, 11.172775268554688, 11.957991600036621, 12.743208885192871, 13.528426170349121, 14.313642501831055, 15.098859786987305, 15.884077072143555, 16.669294357299805, 17.454511642456055, 18.239728927612305, 19.024944305419922, 19.810161590576172, 20.595378875732422, 21.380596160888672, 22.165813446044922, 22.951030731201172, 23.736248016357422, 24.521465301513672, 25.306682586669922, 26.09189796447754, 26.87711524963379, 27.66233253479004, 28.44754981994629]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 13.0, 6.0, 16.0, 18.0, 10.0, 23.0, 22.0, 17.0, 30.0, 24.0, 38.0, 34.0, 36.0, 36.0, 38.0, 40.0, 40.0, 55.0, 38.0, 44.0, 41.0, 34.0, 37.0, 40.0, 47.0, 32.0, 23.0, 22.0, 20.0, 21.0, 21.0, 14.0, 12.0, 12.0, 9.0, 4.0, 5.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.896875381469727, -22.11444854736328, -21.332019805908203, -20.549592971801758, -19.767166137695312, -18.984737396240234, -18.20231056213379, -17.419883728027344, -16.637454986572266, -15.855027198791504, -15.072599411010742, -14.290172576904297, -13.507744789123535, -12.725317001342773, -11.942890167236328, -11.160462379455566, -10.378034591674805, -9.595606803894043, -8.813179016113281, -8.030752182006836, -7.248324394226074, -6.4658966064453125, -5.683469295501709, -4.9010419845581055, -4.118614196777344, -3.336186647415161, -2.5537590980529785, -1.771331548690796, -0.9889039993286133, -0.20647644996643066, 0.575951099395752, 1.3583784103393555, 2.14080810546875, 2.9232356548309326, 3.7056632041931152, 4.488090515136719, 5.2705183029174805, 6.052946090698242, 6.835373401641846, 7.617800712585449, 8.400228500366211, 9.182656288146973, 9.965084075927734, 10.74751091003418, 11.529938697814941, 12.312366485595703, 13.094793319702148, 13.87722110748291, 14.659648895263672, 15.442076683044434, 16.224504470825195, 17.00693130493164, 17.78936004638672, 18.571786880493164, 19.35421371459961, 20.136642456054688, 20.919069290161133, 21.701496124267578, 22.483924865722656, 23.2663516998291, 24.048778533935547, 24.831207275390625, 25.61363410949707, 26.396060943603516, 27.178489685058594]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 11.0, 12.0, 27.0, 33.0, 68.0, 94.0, 138.0, 244.0, 356.0, 520.0, 856.0, 1344.0, 2245.0, 3606.0, 5966.0, 9744.0, 16857.0, 28156.0, 49147.0, 84316.0, 145256.0, 245899.0, 386338.0, 540275.0, 644264.0, 630110.0, 511904.0, 352876.0, 220749.0, 130128.0, 74969.0, 42990.0, 25588.0, 15304.0, 9112.0, 5616.0, 3419.0, 2143.0, 1366.0, 846.0, 500.0, 314.0, 208.0, 135.0, 91.0, 66.0, 31.0, 16.0, 18.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.296875, -16.737060546875, -16.17724609375, -15.617431640625, -15.0576171875, -14.497802734375, -13.93798828125, -13.378173828125, -12.818359375, -12.258544921875, -11.69873046875, -11.138916015625, -10.5791015625, -10.019287109375, -9.45947265625, -8.899658203125, -8.33984375, -7.780029296875, -7.22021484375, -6.660400390625, -6.1005859375, -5.540771484375, -4.98095703125, -4.421142578125, -3.861328125, -3.301513671875, -2.74169921875, -2.181884765625, -1.6220703125, -1.062255859375, -0.50244140625, 0.057373046875, 0.6171875, 1.177001953125, 1.73681640625, 2.296630859375, 2.8564453125, 3.416259765625, 3.97607421875, 4.535888671875, 5.095703125, 5.655517578125, 6.21533203125, 6.775146484375, 7.3349609375, 7.894775390625, 8.45458984375, 9.014404296875, 9.57421875, 10.134033203125, 10.69384765625, 11.253662109375, 11.8134765625, 12.373291015625, 12.93310546875, 13.492919921875, 14.052734375, 14.612548828125, 15.17236328125, 15.732177734375, 16.2919921875, 16.851806640625, 17.41162109375, 17.971435546875, 18.53125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 8.0, 2.0, 5.0, 6.0, 6.0, 14.0, 15.0, 17.0, 16.0, 22.0, 16.0, 21.0, 29.0, 33.0, 36.0, 42.0, 42.0, 37.0, 40.0, 48.0, 42.0, 38.0, 47.0, 41.0, 46.0, 39.0, 40.0, 43.0, 34.0, 25.0, 12.0, 22.0, 21.0, 22.0, 15.0, 2.0, 16.0, 14.0, 7.0, 5.0, 8.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.733154296875, -19.06005859375, -18.386962890625, -17.7138671875, -17.040771484375, -16.36767578125, -15.694580078125, -15.021484375, -14.348388671875, -13.67529296875, -13.002197265625, -12.3291015625, -11.656005859375, -10.98291015625, -10.309814453125, -9.63671875, -8.963623046875, -8.29052734375, -7.617431640625, -6.9443359375, -6.271240234375, -5.59814453125, -4.925048828125, -4.251953125, -3.578857421875, -2.90576171875, -2.232666015625, -1.5595703125, -0.886474609375, -0.21337890625, 0.459716796875, 1.1328125, 1.805908203125, 2.47900390625, 3.152099609375, 3.8251953125, 4.498291015625, 5.17138671875, 5.844482421875, 6.517578125, 7.190673828125, 7.86376953125, 8.536865234375, 9.2099609375, 9.883056640625, 10.55615234375, 11.229248046875, 11.90234375, 12.575439453125, 13.24853515625, 13.921630859375, 14.5947265625, 15.267822265625, 15.94091796875, 16.614013671875, 17.287109375, 17.960205078125, 18.63330078125, 19.306396484375, 19.9794921875, 20.652587890625, 21.32568359375, 21.998779296875, 22.671875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 7.0, 15.0, 20.0, 41.0, 78.0, 148.0, 250.0, 526.0, 1060.0, 2171.0, 4316.0, 8876.0, 18822.0, 38680.0, 80748.0, 162258.0, 312285.0, 543674.0, 781145.0, 826575.0, 629516.0, 381933.0, 204177.0, 101348.0, 49509.0, 24036.0, 11338.0, 5357.0, 2717.0, 1324.0, 635.0, 318.0, 177.0, 92.0, 46.0, 23.0, 16.0, 8.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.34375, -25.470458984375, -24.59716796875, -23.723876953125, -22.8505859375, -21.977294921875, -21.10400390625, -20.230712890625, -19.357421875, -18.484130859375, -17.61083984375, -16.737548828125, -15.8642578125, -14.990966796875, -14.11767578125, -13.244384765625, -12.37109375, -11.497802734375, -10.62451171875, -9.751220703125, -8.8779296875, -8.004638671875, -7.13134765625, -6.258056640625, -5.384765625, -4.511474609375, -3.63818359375, -2.764892578125, -1.8916015625, -1.018310546875, -0.14501953125, 0.728271484375, 1.6015625, 2.474853515625, 3.34814453125, 4.221435546875, 5.0947265625, 5.968017578125, 6.84130859375, 7.714599609375, 8.587890625, 9.461181640625, 10.33447265625, 11.207763671875, 12.0810546875, 12.954345703125, 13.82763671875, 14.700927734375, 15.57421875, 16.447509765625, 17.32080078125, 18.194091796875, 19.0673828125, 19.940673828125, 20.81396484375, 21.687255859375, 22.560546875, 23.433837890625, 24.30712890625, 25.180419921875, 26.0537109375, 26.927001953125, 27.80029296875, 28.673583984375, 29.546875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 7.0, 11.0, 13.0, 10.0, 17.0, 22.0, 26.0, 37.0, 48.0, 57.0, 53.0, 81.0, 101.0, 138.0, 117.0, 144.0, 167.0, 165.0, 179.0, 218.0, 215.0, 225.0, 208.0, 220.0, 204.0, 185.0, 153.0, 140.0, 140.0, 127.0, 126.0, 104.0, 77.0, 66.0, 51.0, 53.0, 33.0, 28.0, 30.0, 21.0, 14.0, 8.0, 5.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-8.328125, -8.0731201171875, -7.818115234375, -7.5631103515625, -7.30810546875, -7.0531005859375, -6.798095703125, -6.5430908203125, -6.2880859375, -6.0330810546875, -5.778076171875, -5.5230712890625, -5.26806640625, -5.0130615234375, -4.758056640625, -4.5030517578125, -4.248046875, -3.9930419921875, -3.738037109375, -3.4830322265625, -3.22802734375, -2.9730224609375, -2.718017578125, -2.4630126953125, -2.2080078125, -1.9530029296875, -1.697998046875, -1.4429931640625, -1.18798828125, -0.9329833984375, -0.677978515625, -0.4229736328125, -0.16796875, 0.0870361328125, 0.342041015625, 0.5970458984375, 0.85205078125, 1.1070556640625, 1.362060546875, 1.6170654296875, 1.8720703125, 2.1270751953125, 2.382080078125, 2.6370849609375, 2.89208984375, 3.1470947265625, 3.402099609375, 3.6571044921875, 3.912109375, 4.1671142578125, 4.422119140625, 4.6771240234375, 4.93212890625, 5.1871337890625, 5.442138671875, 5.6971435546875, 5.9521484375, 6.2071533203125, 6.462158203125, 6.7171630859375, 6.97216796875, 7.2271728515625, 7.482177734375, 7.7371826171875, 7.9921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 9.0, 7.0, 5.0, 10.0, 14.0, 13.0, 16.0, 16.0, 22.0, 19.0, 26.0, 28.0, 33.0, 29.0, 36.0, 39.0, 48.0, 44.0, 46.0, 51.0, 44.0, 36.0, 43.0, 42.0, 31.0, 33.0, 40.0, 25.0, 28.0, 32.0, 21.0, 20.0, 19.0, 20.0, 12.0, 5.0, 11.0, 6.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.309255599975586, -18.591999053955078, -17.87474250793457, -17.157485961914062, -16.440229415893555, -15.722972869873047, -15.005716323852539, -14.288459777832031, -13.571203231811523, -12.853946685791016, -12.136690139770508, -11.41943359375, -10.702177047729492, -9.984920501708984, -9.267663955688477, -8.550407409667969, -7.833150863647461, -7.115894317626953, -6.398637771606445, -5.6813812255859375, -4.96412467956543, -4.246868133544922, -3.529611587524414, -2.8123550415039062, -2.0950984954833984, -1.3778419494628906, -0.6605854034423828, 0.056671142578125, 0.7739276885986328, 1.4911842346191406, 2.2084407806396484, 2.9256973266601562, 3.642953872680664, 4.360210418701172, 5.07746696472168, 5.7947235107421875, 6.511980056762695, 7.229236602783203, 7.946493148803711, 8.663749694824219, 9.381006240844727, 10.098262786865234, 10.815519332885742, 11.53277587890625, 12.250032424926758, 12.967288970947266, 13.684545516967773, 14.401802062988281, 15.119058609008789, 15.836315155029297, 16.553571701049805, 17.270828247070312, 17.98808479309082, 18.705341339111328, 19.422597885131836, 20.139854431152344, 20.85711097717285, 21.57436752319336, 22.291624069213867, 23.008880615234375, 23.726137161254883, 24.44339370727539, 25.1606502532959, 25.877906799316406, 26.595163345336914]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 5.0, 4.0, 6.0, 8.0, 2.0, 17.0, 9.0, 17.0, 23.0, 27.0, 20.0, 26.0, 22.0, 23.0, 23.0, 23.0, 34.0, 38.0, 34.0, 50.0, 44.0, 42.0, 51.0, 44.0, 45.0, 30.0, 29.0, 35.0, 23.0, 34.0, 22.0, 31.0, 22.0, 23.0, 18.0, 16.0, 15.0, 8.0, 10.0, 12.0, 6.0, 9.0, 7.0, 4.0, 1.0, 7.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.487255096435547, -21.808433532714844, -21.12961196899414, -20.45079231262207, -19.771970748901367, -19.093149185180664, -18.414329528808594, -17.73550796508789, -17.056686401367188, -16.377864837646484, -15.699044227600098, -15.020223617553711, -14.341402053833008, -13.662580490112305, -12.983759880065918, -12.304939270019531, -11.626117706298828, -10.947296142578125, -10.268475532531738, -9.589654922485352, -8.910833358764648, -8.232011795043945, -7.553191184997559, -6.874370098114014, -6.195549011230469, -5.516727924346924, -4.837906837463379, -4.159085750579834, -3.480264663696289, -2.801443576812744, -2.122622489929199, -1.4438014030456543, -0.7649784088134766, -0.08615732192993164, 0.5926637649536133, 1.2714848518371582, 1.9503059387207031, 2.629127025604248, 3.307948112487793, 3.986769199371338, 4.665590286254883, 5.344411373138428, 6.023232460021973, 6.702053546905518, 7.3808746337890625, 8.059696197509766, 8.738516807556152, 9.417337417602539, 10.096158981323242, 10.774980545043945, 11.453801155090332, 12.132621765136719, 12.811443328857422, 13.490264892578125, 14.169085502624512, 14.847906112670898, 15.526727676391602, 16.205549240112305, 16.884368896484375, 17.563190460205078, 18.24201202392578, 18.920833587646484, 19.599655151367188, 20.278474807739258, 20.95729637145996]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 8.0, 9.0, 11.0, 14.0, 15.0, 32.0, 37.0, 56.0, 91.0, 129.0, 161.0, 316.0, 443.0, 684.0, 959.0, 1469.0, 2210.0, 3355.0, 4946.0, 7741.0, 12306.0, 21076.0, 39832.0, 80800.0, 160083.0, 242061.0, 213414.0, 121339.0, 59052.0, 30175.0, 16835.0, 10031.0, 6398.0, 4097.0, 2768.0, 1910.0, 1187.0, 851.0, 550.0, 366.0, 256.0, 167.0, 109.0, 68.0, 51.0, 36.0, 17.0, 22.0, 8.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.54736328125, -31.3759765625, -30.20458984375, -29.033203125, -27.86181640625, -26.6904296875, -25.51904296875, -24.34765625, -23.17626953125, -22.0048828125, -20.83349609375, -19.662109375, -18.49072265625, -17.3193359375, -16.14794921875, -14.9765625, -13.80517578125, -12.6337890625, -11.46240234375, -10.291015625, -9.11962890625, -7.9482421875, -6.77685546875, -5.60546875, -4.43408203125, -3.2626953125, -2.09130859375, -0.919921875, 0.25146484375, 1.4228515625, 2.59423828125, 3.765625, 4.93701171875, 6.1083984375, 7.27978515625, 8.451171875, 9.62255859375, 10.7939453125, 11.96533203125, 13.13671875, 14.30810546875, 15.4794921875, 16.65087890625, 17.822265625, 18.99365234375, 20.1650390625, 21.33642578125, 22.5078125, 23.67919921875, 24.8505859375, 26.02197265625, 27.193359375, 28.36474609375, 29.5361328125, 30.70751953125, 31.87890625, 33.05029296875, 34.2216796875, 35.39306640625, 36.564453125, 37.73583984375, 38.9072265625, 40.07861328125, 41.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 10.0, 8.0, 5.0, 5.0, 21.0, 13.0, 5.0, 25.0, 23.0, 26.0, 28.0, 29.0, 33.0, 25.0, 27.0, 37.0, 40.0, 50.0, 41.0, 40.0, 42.0, 47.0, 52.0, 28.0, 39.0, 29.0, 27.0, 32.0, 27.0, 27.0, 27.0, 24.0, 18.0, 16.0, 13.0, 9.0, 8.0, 11.0, 8.0, 7.0, 5.0, 4.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-23.8125, -23.116455078125, -22.42041015625, -21.724365234375, -21.0283203125, -20.332275390625, -19.63623046875, -18.940185546875, -18.244140625, -17.548095703125, -16.85205078125, -16.156005859375, -15.4599609375, -14.763916015625, -14.06787109375, -13.371826171875, -12.67578125, -11.979736328125, -11.28369140625, -10.587646484375, -9.8916015625, -9.195556640625, -8.49951171875, -7.803466796875, -7.107421875, -6.411376953125, -5.71533203125, -5.019287109375, -4.3232421875, -3.627197265625, -2.93115234375, -2.235107421875, -1.5390625, -0.843017578125, -0.14697265625, 0.549072265625, 1.2451171875, 1.941162109375, 2.63720703125, 3.333251953125, 4.029296875, 4.725341796875, 5.42138671875, 6.117431640625, 6.8134765625, 7.509521484375, 8.20556640625, 8.901611328125, 9.59765625, 10.293701171875, 10.98974609375, 11.685791015625, 12.3818359375, 13.077880859375, 13.77392578125, 14.469970703125, 15.166015625, 15.862060546875, 16.55810546875, 17.254150390625, 17.9501953125, 18.646240234375, 19.34228515625, 20.038330078125, 20.734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 27.0, 30.0, 43.0, 73.0, 95.0, 144.0, 217.0, 331.0, 498.0, 717.0, 1076.0, 1594.0, 2352.0, 3640.0, 5269.0, 8286.0, 12868.0, 20117.0, 33737.0, 58812.0, 106365.0, 178647.0, 219284.0, 164027.0, 94540.0, 52524.0, 30738.0, 18359.0, 11636.0, 7590.0, 4897.0, 3349.0, 2183.0, 1516.0, 1001.0, 678.0, 436.0, 271.0, 180.0, 150.0, 86.0, 49.0, 30.0, 25.0, 26.0, 13.0, 4.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-32.03125, -30.9775390625, -29.923828125, -28.8701171875, -27.81640625, -26.7626953125, -25.708984375, -24.6552734375, -23.6015625, -22.5478515625, -21.494140625, -20.4404296875, -19.38671875, -18.3330078125, -17.279296875, -16.2255859375, -15.171875, -14.1181640625, -13.064453125, -12.0107421875, -10.95703125, -9.9033203125, -8.849609375, -7.7958984375, -6.7421875, -5.6884765625, -4.634765625, -3.5810546875, -2.52734375, -1.4736328125, -0.419921875, 0.6337890625, 1.6875, 2.7412109375, 3.794921875, 4.8486328125, 5.90234375, 6.9560546875, 8.009765625, 9.0634765625, 10.1171875, 11.1708984375, 12.224609375, 13.2783203125, 14.33203125, 15.3857421875, 16.439453125, 17.4931640625, 18.546875, 19.6005859375, 20.654296875, 21.7080078125, 22.76171875, 23.8154296875, 24.869140625, 25.9228515625, 26.9765625, 28.0302734375, 29.083984375, 30.1376953125, 31.19140625, 32.2451171875, 33.298828125, 34.3525390625, 35.40625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 3.0, 9.0, 20.0, 17.0, 11.0, 22.0, 15.0, 19.0, 29.0, 26.0, 28.0, 32.0, 30.0, 33.0, 44.0, 50.0, 33.0, 28.0, 37.0, 43.0, 48.0, 45.0, 34.0, 45.0, 31.0, 36.0, 25.0, 18.0, 27.0, 17.0, 17.0, 21.0, 20.0, 9.0, 12.0, 6.0, 8.0, 3.0, 11.0, 11.0, 4.0, 1.0, 6.0, 3.0, 2.0, 1.0, 3.0], "bins": [-16.453125, -15.99462890625, -15.5361328125, -15.07763671875, -14.619140625, -14.16064453125, -13.7021484375, -13.24365234375, -12.78515625, -12.32666015625, -11.8681640625, -11.40966796875, -10.951171875, -10.49267578125, -10.0341796875, -9.57568359375, -9.1171875, -8.65869140625, -8.2001953125, -7.74169921875, -7.283203125, -6.82470703125, -6.3662109375, -5.90771484375, -5.44921875, -4.99072265625, -4.5322265625, -4.07373046875, -3.615234375, -3.15673828125, -2.6982421875, -2.23974609375, -1.78125, -1.32275390625, -0.8642578125, -0.40576171875, 0.052734375, 0.51123046875, 0.9697265625, 1.42822265625, 1.88671875, 2.34521484375, 2.8037109375, 3.26220703125, 3.720703125, 4.17919921875, 4.6376953125, 5.09619140625, 5.5546875, 6.01318359375, 6.4716796875, 6.93017578125, 7.388671875, 7.84716796875, 8.3056640625, 8.76416015625, 9.22265625, 9.68115234375, 10.1396484375, 10.59814453125, 11.056640625, 11.51513671875, 11.9736328125, 12.43212890625, 12.890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 8.0, 5.0, 15.0, 14.0, 28.0, 31.0, 63.0, 76.0, 114.0, 174.0, 247.0, 389.0, 582.0, 904.0, 1380.0, 2120.0, 3399.0, 5850.0, 10181.0, 18845.0, 38489.0, 81884.0, 173060.0, 273137.0, 219579.0, 110692.0, 50635.0, 24977.0, 12968.0, 7194.0, 4203.0, 2566.0, 1646.0, 1095.0, 675.0, 442.0, 290.0, 201.0, 138.0, 89.0, 59.0, 35.0, 26.0, 22.0, 8.0, 11.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.8125, -17.25048828125, -16.6884765625, -16.12646484375, -15.564453125, -15.00244140625, -14.4404296875, -13.87841796875, -13.31640625, -12.75439453125, -12.1923828125, -11.63037109375, -11.068359375, -10.50634765625, -9.9443359375, -9.38232421875, -8.8203125, -8.25830078125, -7.6962890625, -7.13427734375, -6.572265625, -6.01025390625, -5.4482421875, -4.88623046875, -4.32421875, -3.76220703125, -3.2001953125, -2.63818359375, -2.076171875, -1.51416015625, -0.9521484375, -0.39013671875, 0.171875, 0.73388671875, 1.2958984375, 1.85791015625, 2.419921875, 2.98193359375, 3.5439453125, 4.10595703125, 4.66796875, 5.22998046875, 5.7919921875, 6.35400390625, 6.916015625, 7.47802734375, 8.0400390625, 8.60205078125, 9.1640625, 9.72607421875, 10.2880859375, 10.85009765625, 11.412109375, 11.97412109375, 12.5361328125, 13.09814453125, 13.66015625, 14.22216796875, 14.7841796875, 15.34619140625, 15.908203125, 16.47021484375, 17.0322265625, 17.59423828125, 18.15625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 6.0, 9.0, 14.0, 23.0, 28.0, 43.0, 62.0, 80.0, 90.0, 111.0, 91.0, 99.0, 92.0, 54.0, 38.0, 20.0, 22.0, 15.0, 17.0, 9.0, 10.0, 8.0, 6.0, 9.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015077590942382812, -0.0014591217041015625, -0.0014104843139648438, -0.001361846923828125, -0.0013132095336914062, -0.0012645721435546875, -0.0012159347534179688, -0.00116729736328125, -0.0011186599731445312, -0.0010700225830078125, -0.0010213851928710938, -0.000972747802734375, -0.0009241104125976562, -0.0008754730224609375, -0.0008268356323242188, -0.0007781982421875, -0.0007295608520507812, -0.0006809234619140625, -0.0006322860717773438, -0.000583648681640625, -0.0005350112915039062, -0.0004863739013671875, -0.00043773651123046875, -0.00038909912109375, -0.00034046173095703125, -0.0002918243408203125, -0.00024318695068359375, -0.000194549560546875, -0.00014591217041015625, -9.72747802734375e-05, -4.863739013671875e-05, 0.0, 4.863739013671875e-05, 9.72747802734375e-05, 0.00014591217041015625, 0.000194549560546875, 0.00024318695068359375, 0.0002918243408203125, 0.00034046173095703125, 0.00038909912109375, 0.00043773651123046875, 0.0004863739013671875, 0.0005350112915039062, 0.000583648681640625, 0.0006322860717773438, 0.0006809234619140625, 0.0007295608520507812, 0.0007781982421875, 0.0008268356323242188, 0.0008754730224609375, 0.0009241104125976562, 0.000972747802734375, 0.0010213851928710938, 0.0010700225830078125, 0.0011186599731445312, 0.00116729736328125, 0.0012159347534179688, 0.0012645721435546875, 0.0013132095336914062, 0.001361846923828125, 0.0014104843139648438, 0.0014591217041015625, 0.0015077590942382812, 0.001556396484375, 0.0016050338745117188]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 9.0, 6.0, 21.0, 30.0, 34.0, 84.0, 84.0, 138.0, 242.0, 335.0, 530.0, 892.0, 1523.0, 2662.0, 4880.0, 9145.0, 17679.0, 35278.0, 69995.0, 129472.0, 201296.0, 221061.0, 162301.0, 92698.0, 47580.0, 23940.0, 12092.0, 6190.0, 3369.0, 2019.0, 1092.0, 690.0, 405.0, 268.0, 184.0, 107.0, 80.0, 43.0, 37.0, 21.0, 13.0, 10.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.4375, -16.896240234375, -16.35498046875, -15.813720703125, -15.2724609375, -14.731201171875, -14.18994140625, -13.648681640625, -13.107421875, -12.566162109375, -12.02490234375, -11.483642578125, -10.9423828125, -10.401123046875, -9.85986328125, -9.318603515625, -8.77734375, -8.236083984375, -7.69482421875, -7.153564453125, -6.6123046875, -6.071044921875, -5.52978515625, -4.988525390625, -4.447265625, -3.906005859375, -3.36474609375, -2.823486328125, -2.2822265625, -1.740966796875, -1.19970703125, -0.658447265625, -0.1171875, 0.424072265625, 0.96533203125, 1.506591796875, 2.0478515625, 2.589111328125, 3.13037109375, 3.671630859375, 4.212890625, 4.754150390625, 5.29541015625, 5.836669921875, 6.3779296875, 6.919189453125, 7.46044921875, 8.001708984375, 8.54296875, 9.084228515625, 9.62548828125, 10.166748046875, 10.7080078125, 11.249267578125, 11.79052734375, 12.331787109375, 12.873046875, 13.414306640625, 13.95556640625, 14.496826171875, 15.0380859375, 15.579345703125, 16.12060546875, 16.661865234375, 17.203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 5.0, 12.0, 10.0, 13.0, 12.0, 23.0, 25.0, 33.0, 40.0, 40.0, 40.0, 51.0, 66.0, 79.0, 70.0, 77.0, 59.0, 65.0, 41.0, 45.0, 36.0, 32.0, 19.0, 20.0, 20.0, 6.0, 8.0, 13.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-6.671875, -6.4896240234375, -6.307373046875, -6.1251220703125, -5.94287109375, -5.7606201171875, -5.578369140625, -5.3961181640625, -5.2138671875, -5.0316162109375, -4.849365234375, -4.6671142578125, -4.48486328125, -4.3026123046875, -4.120361328125, -3.9381103515625, -3.755859375, -3.5736083984375, -3.391357421875, -3.2091064453125, -3.02685546875, -2.8446044921875, -2.662353515625, -2.4801025390625, -2.2978515625, -2.1156005859375, -1.933349609375, -1.7510986328125, -1.56884765625, -1.3865966796875, -1.204345703125, -1.0220947265625, -0.83984375, -0.6575927734375, -0.475341796875, -0.2930908203125, -0.11083984375, 0.0714111328125, 0.253662109375, 0.4359130859375, 0.6181640625, 0.8004150390625, 0.982666015625, 1.1649169921875, 1.34716796875, 1.5294189453125, 1.711669921875, 1.8939208984375, 2.076171875, 2.2584228515625, 2.440673828125, 2.6229248046875, 2.80517578125, 2.9874267578125, 3.169677734375, 3.3519287109375, 3.5341796875, 3.7164306640625, 3.898681640625, 4.0809326171875, 4.26318359375, 4.4454345703125, 4.627685546875, 4.8099365234375, 4.9921875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 7.0, 3.0, 6.0, 9.0, 15.0, 11.0, 20.0, 23.0, 21.0, 25.0, 25.0, 35.0, 35.0, 52.0, 41.0, 43.0, 53.0, 47.0, 44.0, 48.0, 53.0, 42.0, 43.0, 41.0, 46.0, 35.0, 33.0, 19.0, 26.0, 15.0, 21.0, 17.0, 12.0, 11.0, 4.0, 7.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.835206985473633, -18.094234466552734, -17.35326385498047, -16.61229133605957, -15.871318817138672, -15.13034725189209, -14.389375686645508, -13.64840316772461, -12.907431602478027, -12.166460037231445, -11.425487518310547, -10.684515953063965, -9.943544387817383, -9.202571868896484, -8.461600303649902, -7.720628261566162, -6.979656219482422, -6.238684177398682, -5.497712135314941, -4.756740570068359, -4.015768527984619, -3.274796485900879, -2.533824920654297, -1.7928528785705566, -1.0518808364868164, -0.3109089136123657, 0.43006300926208496, 1.171034812927246, 1.9120068550109863, 2.6529788970947266, 3.3939504623413086, 4.134922504425049, 4.875894546508789, 5.616866588592529, 6.3578386306762695, 7.098810195922852, 7.839782238006592, 8.580754280090332, 9.321725845336914, 10.062698364257812, 10.803669929504395, 11.544641494750977, 12.285614013671875, 13.026585578918457, 13.767557144165039, 14.508529663085938, 15.24950122833252, 15.990472793579102, 16.7314453125, 17.4724178314209, 18.213388442993164, 18.954360961914062, 19.69533348083496, 20.43630599975586, 21.177276611328125, 21.918249130249023, 22.659221649169922, 23.40019416809082, 24.141164779663086, 24.882137298583984, 25.623109817504883, 26.36408233642578, 27.105052947998047, 27.846025466918945, 28.58699607849121]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 6.0, 2.0, 5.0, 8.0, 13.0, 11.0, 7.0, 15.0, 21.0, 25.0, 22.0, 28.0, 29.0, 20.0, 34.0, 33.0, 33.0, 37.0, 43.0, 34.0, 45.0, 53.0, 46.0, 33.0, 40.0, 41.0, 37.0, 34.0, 22.0, 28.0, 27.0, 20.0, 28.0, 22.0, 19.0, 11.0, 16.0, 6.0, 14.0, 6.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.401037216186523, -21.73367691040039, -21.066314697265625, -20.398954391479492, -19.73159408569336, -19.064233779907227, -18.396873474121094, -17.729511260986328, -17.062150955200195, -16.394790649414062, -15.727429389953613, -15.060068130493164, -14.392707824707031, -13.725347518920898, -13.05798625946045, -12.390625, -11.723264694213867, -11.055904388427734, -10.388543128967285, -9.721181869506836, -9.053821563720703, -8.38646125793457, -7.719099998474121, -7.05173921585083, -6.384378433227539, -5.717017650604248, -5.049656867980957, -4.382296085357666, -3.714935302734375, -3.047574520111084, -2.380213737487793, -1.712852954864502, -1.045492172241211, -0.3781313896179199, 0.2892293930053711, 0.9565901756286621, 1.6239509582519531, 2.291311740875244, 2.958672523498535, 3.626033306121826, 4.293394088745117, 4.960754871368408, 5.628115653991699, 6.29547643661499, 6.962837219238281, 7.630198001861572, 8.297558784484863, 8.964920043945312, 9.632280349731445, 10.299640655517578, 10.967001914978027, 11.634363174438477, 12.30172348022461, 12.969083786010742, 13.636445045471191, 14.30380630493164, 14.971166610717773, 15.638526916503906, 16.305889129638672, 16.973249435424805, 17.640609741210938, 18.30797004699707, 18.975330352783203, 19.64269256591797, 20.3100528717041]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 3.0, 9.0, 13.0, 25.0, 42.0, 66.0, 111.0, 205.0, 326.0, 456.0, 784.0, 1244.0, 2022.0, 3365.0, 5427.0, 8735.0, 13675.0, 20771.0, 31196.0, 44752.0, 61385.0, 80027.0, 96494.0, 108949.0, 112842.0, 106634.0, 93116.0, 75662.0, 57570.0, 41599.0, 28781.0, 19281.0, 12419.0, 7739.0, 4966.0, 2998.0, 1889.0, 1140.0, 728.0, 435.0, 250.0, 159.0, 86.0, 79.0, 47.0, 20.0, 16.0, 12.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.5546875, -15.0888671875, -14.623046875, -14.1572265625, -13.69140625, -13.2255859375, -12.759765625, -12.2939453125, -11.828125, -11.3623046875, -10.896484375, -10.4306640625, -9.96484375, -9.4990234375, -9.033203125, -8.5673828125, -8.1015625, -7.6357421875, -7.169921875, -6.7041015625, -6.23828125, -5.7724609375, -5.306640625, -4.8408203125, -4.375, -3.9091796875, -3.443359375, -2.9775390625, -2.51171875, -2.0458984375, -1.580078125, -1.1142578125, -0.6484375, -0.1826171875, 0.283203125, 0.7490234375, 1.21484375, 1.6806640625, 2.146484375, 2.6123046875, 3.078125, 3.5439453125, 4.009765625, 4.4755859375, 4.94140625, 5.4072265625, 5.873046875, 6.3388671875, 6.8046875, 7.2705078125, 7.736328125, 8.2021484375, 8.66796875, 9.1337890625, 9.599609375, 10.0654296875, 10.53125, 10.9970703125, 11.462890625, 11.9287109375, 12.39453125, 12.8603515625, 13.326171875, 13.7919921875, 14.2578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 10.0, 12.0, 13.0, 16.0, 25.0, 21.0, 27.0, 33.0, 23.0, 35.0, 42.0, 25.0, 35.0, 40.0, 50.0, 53.0, 32.0, 38.0, 46.0, 47.0, 38.0, 25.0, 43.0, 34.0, 31.0, 30.0, 23.0, 16.0, 23.0, 17.0, 15.0, 15.0, 8.0, 10.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.03271484375, -20.3466796875, -19.66064453125, -18.974609375, -18.28857421875, -17.6025390625, -16.91650390625, -16.23046875, -15.54443359375, -14.8583984375, -14.17236328125, -13.486328125, -12.80029296875, -12.1142578125, -11.42822265625, -10.7421875, -10.05615234375, -9.3701171875, -8.68408203125, -7.998046875, -7.31201171875, -6.6259765625, -5.93994140625, -5.25390625, -4.56787109375, -3.8818359375, -3.19580078125, -2.509765625, -1.82373046875, -1.1376953125, -0.45166015625, 0.234375, 0.92041015625, 1.6064453125, 2.29248046875, 2.978515625, 3.66455078125, 4.3505859375, 5.03662109375, 5.72265625, 6.40869140625, 7.0947265625, 7.78076171875, 8.466796875, 9.15283203125, 9.8388671875, 10.52490234375, 11.2109375, 11.89697265625, 12.5830078125, 13.26904296875, 13.955078125, 14.64111328125, 15.3271484375, 16.01318359375, 16.69921875, 17.38525390625, 18.0712890625, 18.75732421875, 19.443359375, 20.12939453125, 20.8154296875, 21.50146484375, 22.1875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 13.0, 13.0, 34.0, 40.0, 55.0, 76.0, 135.0, 205.0, 301.0, 453.0, 663.0, 1097.0, 1739.0, 2671.0, 4218.0, 6807.0, 10762.0, 16657.0, 25109.0, 37904.0, 54530.0, 73889.0, 92937.0, 109375.0, 116967.0, 114192.0, 101085.0, 82363.0, 62332.0, 44793.0, 30916.0, 20142.0, 13089.0, 8437.0, 5280.0, 3350.0, 2116.0, 1364.0, 863.0, 578.0, 344.0, 216.0, 150.0, 92.0, 60.0, 45.0, 33.0, 26.0, 15.0, 10.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-16.90625, -16.3896484375, -15.873046875, -15.3564453125, -14.83984375, -14.3232421875, -13.806640625, -13.2900390625, -12.7734375, -12.2568359375, -11.740234375, -11.2236328125, -10.70703125, -10.1904296875, -9.673828125, -9.1572265625, -8.640625, -8.1240234375, -7.607421875, -7.0908203125, -6.57421875, -6.0576171875, -5.541015625, -5.0244140625, -4.5078125, -3.9912109375, -3.474609375, -2.9580078125, -2.44140625, -1.9248046875, -1.408203125, -0.8916015625, -0.375, 0.1416015625, 0.658203125, 1.1748046875, 1.69140625, 2.2080078125, 2.724609375, 3.2412109375, 3.7578125, 4.2744140625, 4.791015625, 5.3076171875, 5.82421875, 6.3408203125, 6.857421875, 7.3740234375, 7.890625, 8.4072265625, 8.923828125, 9.4404296875, 9.95703125, 10.4736328125, 10.990234375, 11.5068359375, 12.0234375, 12.5400390625, 13.056640625, 13.5732421875, 14.08984375, 14.6064453125, 15.123046875, 15.6396484375, 16.15625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 3.0, 6.0, 4.0, 7.0, 5.0, 8.0, 11.0, 14.0, 15.0, 25.0, 30.0, 18.0, 35.0, 23.0, 27.0, 40.0, 22.0, 31.0, 26.0, 32.0, 34.0, 42.0, 39.0, 42.0, 32.0, 38.0, 45.0, 39.0, 33.0, 31.0, 38.0, 19.0, 20.0, 15.0, 21.0, 22.0, 18.0, 20.0, 13.0, 12.0, 10.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 4.0, 6.0, 0.0, 4.0, 0.0, 1.0], "bins": [-12.90625, -12.5198974609375, -12.133544921875, -11.7471923828125, -11.36083984375, -10.9744873046875, -10.588134765625, -10.2017822265625, -9.8154296875, -9.4290771484375, -9.042724609375, -8.6563720703125, -8.27001953125, -7.8836669921875, -7.497314453125, -7.1109619140625, -6.724609375, -6.3382568359375, -5.951904296875, -5.5655517578125, -5.17919921875, -4.7928466796875, -4.406494140625, -4.0201416015625, -3.6337890625, -3.2474365234375, -2.861083984375, -2.4747314453125, -2.08837890625, -1.7020263671875, -1.315673828125, -0.9293212890625, -0.54296875, -0.1566162109375, 0.229736328125, 0.6160888671875, 1.00244140625, 1.3887939453125, 1.775146484375, 2.1614990234375, 2.5478515625, 2.9342041015625, 3.320556640625, 3.7069091796875, 4.09326171875, 4.4796142578125, 4.865966796875, 5.2523193359375, 5.638671875, 6.0250244140625, 6.411376953125, 6.7977294921875, 7.18408203125, 7.5704345703125, 7.956787109375, 8.3431396484375, 8.7294921875, 9.1158447265625, 9.502197265625, 9.8885498046875, 10.27490234375, 10.6612548828125, 11.047607421875, 11.4339599609375, 11.8203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 14.0, 21.0, 34.0, 48.0, 86.0, 152.0, 223.0, 388.0, 615.0, 1037.0, 1796.0, 3053.0, 4993.0, 8547.0, 14239.0, 23974.0, 39212.0, 60616.0, 89661.0, 119760.0, 141035.0, 143189.0, 125228.0, 95909.0, 66234.0, 42858.0, 26293.0, 15909.0, 9464.0, 5717.0, 3335.0, 1945.0, 1204.0, 715.0, 416.0, 256.0, 161.0, 88.0, 52.0, 33.0, 13.0, 11.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.046875, -7.79620361328125, -7.5455322265625, -7.29486083984375, -7.044189453125, -6.79351806640625, -6.5428466796875, -6.29217529296875, -6.04150390625, -5.79083251953125, -5.5401611328125, -5.28948974609375, -5.038818359375, -4.78814697265625, -4.5374755859375, -4.28680419921875, -4.0361328125, -3.78546142578125, -3.5347900390625, -3.28411865234375, -3.033447265625, -2.78277587890625, -2.5321044921875, -2.28143310546875, -2.03076171875, -1.78009033203125, -1.5294189453125, -1.27874755859375, -1.028076171875, -0.77740478515625, -0.5267333984375, -0.27606201171875, -0.025390625, 0.22528076171875, 0.4759521484375, 0.72662353515625, 0.977294921875, 1.22796630859375, 1.4786376953125, 1.72930908203125, 1.97998046875, 2.23065185546875, 2.4813232421875, 2.73199462890625, 2.982666015625, 3.23333740234375, 3.4840087890625, 3.73468017578125, 3.9853515625, 4.23602294921875, 4.4866943359375, 4.73736572265625, 4.988037109375, 5.23870849609375, 5.4893798828125, 5.74005126953125, 5.99072265625, 6.24139404296875, 6.4920654296875, 6.74273681640625, 6.993408203125, 7.24407958984375, 7.4947509765625, 7.74542236328125, 7.99609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 9.0, 8.0, 10.0, 17.0, 12.0, 16.0, 22.0, 23.0, 33.0, 40.0, 31.0, 38.0, 47.0, 56.0, 53.0, 52.0, 49.0, 48.0, 51.0, 57.0, 54.0, 39.0, 35.0, 38.0, 33.0, 18.0, 27.0, 17.0, 11.0, 15.0, 8.0, 9.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007271766662597656, -0.0006975308060646057, -0.0006678849458694458, -0.0006382390856742859, -0.000608593225479126, -0.0005789473652839661, -0.0005493015050888062, -0.0005196556448936462, -0.0004900097846984863, -0.0004603639245033264, -0.0004307180643081665, -0.0004010722041130066, -0.0003714263439178467, -0.00034178048372268677, -0.00031213462352752686, -0.00028248876333236694, -0.00025284290313720703, -0.00022319704294204712, -0.0001935511827468872, -0.0001639053225517273, -0.00013425946235656738, -0.00010461360216140747, -7.496774196624756e-05, -4.5321881771087646e-05, -1.5676021575927734e-05, 1.3969838619232178e-05, 4.361569881439209e-05, 7.3261559009552e-05, 0.00010290741920471191, 0.00013255327939987183, 0.00016219913959503174, 0.00019184499979019165, 0.00022149085998535156, 0.0002511367201805115, 0.0002807825803756714, 0.0003104284405708313, 0.0003400743007659912, 0.0003697201609611511, 0.00039936602115631104, 0.00042901188135147095, 0.00045865774154663086, 0.0004883036017417908, 0.0005179494619369507, 0.0005475953221321106, 0.0005772411823272705, 0.0006068870425224304, 0.0006365329027175903, 0.0006661787629127502, 0.0006958246231079102, 0.0007254704833030701, 0.00075511634349823, 0.0007847622036933899, 0.0008144080638885498, 0.0008440539240837097, 0.0008736997842788696, 0.0009033456444740295, 0.0009329915046691895, 0.0009626373648643494, 0.0009922832250595093, 0.0010219290852546692, 0.001051574945449829, 0.001081220805644989, 0.001110866665840149, 0.0011405125260353088, 0.0011701583862304688]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 10.0, 15.0, 24.0, 22.0, 51.0, 58.0, 107.0, 152.0, 265.0, 431.0, 761.0, 1341.0, 2258.0, 3922.0, 7142.0, 12678.0, 21715.0, 35810.0, 57630.0, 85680.0, 115920.0, 138994.0, 144600.0, 130304.0, 102630.0, 71731.0, 46674.0, 28634.0, 16594.0, 9622.0, 5443.0, 3057.0, 1749.0, 1030.0, 569.0, 383.0, 222.0, 116.0, 71.0, 49.0, 29.0, 15.0, 13.0, 8.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.7823486328125, -7.533447265625, -7.2845458984375, -7.03564453125, -6.7867431640625, -6.537841796875, -6.2889404296875, -6.0400390625, -5.7911376953125, -5.542236328125, -5.2933349609375, -5.04443359375, -4.7955322265625, -4.546630859375, -4.2977294921875, -4.048828125, -3.7999267578125, -3.551025390625, -3.3021240234375, -3.05322265625, -2.8043212890625, -2.555419921875, -2.3065185546875, -2.0576171875, -1.8087158203125, -1.559814453125, -1.3109130859375, -1.06201171875, -0.8131103515625, -0.564208984375, -0.3153076171875, -0.06640625, 0.1824951171875, 0.431396484375, 0.6802978515625, 0.92919921875, 1.1781005859375, 1.427001953125, 1.6759033203125, 1.9248046875, 2.1737060546875, 2.422607421875, 2.6715087890625, 2.92041015625, 3.1693115234375, 3.418212890625, 3.6671142578125, 3.916015625, 4.1649169921875, 4.413818359375, 4.6627197265625, 4.91162109375, 5.1605224609375, 5.409423828125, 5.6583251953125, 5.9072265625, 6.1561279296875, 6.405029296875, 6.6539306640625, 6.90283203125, 7.1517333984375, 7.400634765625, 7.6495361328125, 7.8984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 10.0, 9.0, 8.0, 12.0, 16.0, 16.0, 18.0, 28.0, 31.0, 48.0, 45.0, 43.0, 40.0, 45.0, 48.0, 52.0, 39.0, 55.0, 50.0, 40.0, 51.0, 45.0, 36.0, 24.0, 20.0, 20.0, 28.0, 18.0, 21.0, 14.0, 12.0, 6.0, 8.0, 9.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.32293701171875, -2.2376708984375, -2.15240478515625, -2.067138671875, -1.98187255859375, -1.8966064453125, -1.81134033203125, -1.72607421875, -1.64080810546875, -1.5555419921875, -1.47027587890625, -1.385009765625, -1.29974365234375, -1.2144775390625, -1.12921142578125, -1.0439453125, -0.95867919921875, -0.8734130859375, -0.78814697265625, -0.702880859375, -0.61761474609375, -0.5323486328125, -0.44708251953125, -0.36181640625, -0.27655029296875, -0.1912841796875, -0.10601806640625, -0.020751953125, 0.06451416015625, 0.1497802734375, 0.23504638671875, 0.3203125, 0.40557861328125, 0.4908447265625, 0.57611083984375, 0.661376953125, 0.74664306640625, 0.8319091796875, 0.91717529296875, 1.00244140625, 1.08770751953125, 1.1729736328125, 1.25823974609375, 1.343505859375, 1.42877197265625, 1.5140380859375, 1.59930419921875, 1.6845703125, 1.76983642578125, 1.8551025390625, 1.94036865234375, 2.025634765625, 2.11090087890625, 2.1961669921875, 2.28143310546875, 2.36669921875, 2.45196533203125, 2.5372314453125, 2.62249755859375, 2.707763671875, 2.79302978515625, 2.8782958984375, 2.96356201171875, 3.048828125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 10.0, 12.0, 17.0, 12.0, 22.0, 18.0, 17.0, 33.0, 32.0, 30.0, 33.0, 40.0, 44.0, 38.0, 45.0, 50.0, 43.0, 44.0, 41.0, 41.0, 43.0, 41.0, 35.0, 38.0, 36.0, 30.0, 27.0, 17.0, 24.0, 22.0, 11.0, 8.0, 8.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.8098087310791, -21.138233184814453, -20.466657638549805, -19.795082092285156, -19.12350845336914, -18.451932907104492, -17.780357360839844, -17.108781814575195, -16.437206268310547, -15.765630722045898, -15.094056129455566, -14.422480583190918, -13.750905990600586, -13.079330444335938, -12.407754898071289, -11.73617935180664, -11.064605712890625, -10.393030166625977, -9.721455574035645, -9.049880027770996, -8.378305435180664, -7.706729888916016, -7.035154342651367, -6.363579273223877, -5.692004203796387, -5.0204291343688965, -4.348854064941406, -3.677278518676758, -3.0057034492492676, -2.3341283798217773, -1.662552833557129, -0.9909777641296387, -0.31940460205078125, 0.35217058658599854, 1.0237457752227783, 1.6953210830688477, 2.366896152496338, 3.038471221923828, 3.7100467681884766, 4.381621837615967, 5.053196907043457, 5.724771976470947, 6.3963470458984375, 7.067922592163086, 7.739497661590576, 8.411072731018066, 9.082648277282715, 9.754222869873047, 10.425798416137695, 11.097373962402344, 11.768948554992676, 12.440524101257324, 13.112098693847656, 13.783674240112305, 14.455249786376953, 15.126825332641602, 15.798399925231934, 16.469974517822266, 17.141550064086914, 17.813125610351562, 18.48470115661621, 19.15627670288086, 19.827850341796875, 20.499425888061523, 21.171001434326172]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 17.0, 8.0, 6.0, 9.0, 17.0, 13.0, 23.0, 24.0, 19.0, 32.0, 33.0, 23.0, 31.0, 35.0, 47.0, 58.0, 28.0, 48.0, 43.0, 46.0, 25.0, 39.0, 35.0, 35.0, 40.0, 44.0, 21.0, 23.0, 16.0, 26.0, 22.0, 19.0, 8.0, 11.0, 10.0, 11.0, 6.0, 10.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.029443740844727, -20.367202758789062, -19.7049617767334, -19.042720794677734, -18.38047981262207, -17.718238830566406, -17.05599594116211, -16.393754959106445, -15.731513977050781, -15.069272994995117, -14.407032012939453, -13.744791030883789, -13.082549095153809, -12.420308113098145, -11.75806713104248, -11.0958251953125, -10.433585166931152, -9.771344184875488, -9.109103202819824, -8.446861267089844, -7.78462028503418, -7.122379302978516, -6.460138320922852, -5.797896862030029, -5.135655879974365, -4.473414897918701, -3.811173439025879, -3.148932456970215, -2.4866912364959717, -1.8244500160217285, -1.1622090339660645, -0.4999675750732422, 0.16227340698242188, 0.8245145678520203, 1.4867557287216187, 2.1489968299865723, 2.8112380504608154, 3.4734792709350586, 4.135720252990723, 4.797961711883545, 5.460202693939209, 6.122443675994873, 6.784685134887695, 7.446926116943359, 8.109167098999023, 8.771408081054688, 9.433649063110352, 10.095890998840332, 10.758131980895996, 11.42037296295166, 12.082613945007324, 12.744855880737305, 13.407096862792969, 14.069337844848633, 14.731578826904297, 15.393819808959961, 16.056060791015625, 16.71830177307129, 17.380542755126953, 18.042783737182617, 18.70502471923828, 19.367267608642578, 20.02950668334961, 20.691749572753906, 21.35399055480957]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 13.0, 9.0, 23.0, 37.0, 35.0, 57.0, 88.0, 134.0, 202.0, 297.0, 529.0, 908.0, 1342.0, 2239.0, 3789.0, 6367.0, 10961.0, 19143.0, 33886.0, 61417.0, 112748.0, 201629.0, 342803.0, 521297.0, 669180.0, 691780.0, 573551.0, 393460.0, 238562.0, 135125.0, 74692.0, 41494.0, 23387.0, 13412.0, 7821.0, 4742.0, 2753.0, 1694.0, 994.0, 645.0, 397.0, 243.0, 147.0, 99.0, 50.0, 37.0, 26.0, 19.0, 15.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.953125, -17.394775390625, -16.83642578125, -16.278076171875, -15.7197265625, -15.161376953125, -14.60302734375, -14.044677734375, -13.486328125, -12.927978515625, -12.36962890625, -11.811279296875, -11.2529296875, -10.694580078125, -10.13623046875, -9.577880859375, -9.01953125, -8.461181640625, -7.90283203125, -7.344482421875, -6.7861328125, -6.227783203125, -5.66943359375, -5.111083984375, -4.552734375, -3.994384765625, -3.43603515625, -2.877685546875, -2.3193359375, -1.760986328125, -1.20263671875, -0.644287109375, -0.0859375, 0.472412109375, 1.03076171875, 1.589111328125, 2.1474609375, 2.705810546875, 3.26416015625, 3.822509765625, 4.380859375, 4.939208984375, 5.49755859375, 6.055908203125, 6.6142578125, 7.172607421875, 7.73095703125, 8.289306640625, 8.84765625, 9.406005859375, 9.96435546875, 10.522705078125, 11.0810546875, 11.639404296875, 12.19775390625, 12.756103515625, 13.314453125, 13.872802734375, 14.43115234375, 14.989501953125, 15.5478515625, 16.106201171875, 16.66455078125, 17.222900390625, 17.78125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 10.0, 11.0, 14.0, 14.0, 17.0, 18.0, 22.0, 34.0, 31.0, 36.0, 38.0, 34.0, 36.0, 48.0, 35.0, 54.0, 49.0, 51.0, 47.0, 37.0, 45.0, 38.0, 35.0, 39.0, 22.0, 26.0, 15.0, 27.0, 22.0, 15.0, 15.0, 7.0, 12.0, 13.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.03125, -20.39208984375, -19.7529296875, -19.11376953125, -18.474609375, -17.83544921875, -17.1962890625, -16.55712890625, -15.91796875, -15.27880859375, -14.6396484375, -14.00048828125, -13.361328125, -12.72216796875, -12.0830078125, -11.44384765625, -10.8046875, -10.16552734375, -9.5263671875, -8.88720703125, -8.248046875, -7.60888671875, -6.9697265625, -6.33056640625, -5.69140625, -5.05224609375, -4.4130859375, -3.77392578125, -3.134765625, -2.49560546875, -1.8564453125, -1.21728515625, -0.578125, 0.06103515625, 0.7001953125, 1.33935546875, 1.978515625, 2.61767578125, 3.2568359375, 3.89599609375, 4.53515625, 5.17431640625, 5.8134765625, 6.45263671875, 7.091796875, 7.73095703125, 8.3701171875, 9.00927734375, 9.6484375, 10.28759765625, 10.9267578125, 11.56591796875, 12.205078125, 12.84423828125, 13.4833984375, 14.12255859375, 14.76171875, 15.40087890625, 16.0400390625, 16.67919921875, 17.318359375, 17.95751953125, 18.5966796875, 19.23583984375, 19.875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 4.0, 8.0, 17.0, 59.0, 57.0, 108.0, 184.0, 310.0, 497.0, 843.0, 1510.0, 2626.0, 4738.0, 8520.0, 15014.0, 26996.0, 48792.0, 87159.0, 152838.0, 259024.0, 409223.0, 579404.0, 683271.0, 642734.0, 489873.0, 323748.0, 196655.0, 114308.0, 64509.0, 36105.0, 19693.0, 10961.0, 6219.0, 3561.0, 1920.0, 1115.0, 703.0, 403.0, 242.0, 130.0, 79.0, 62.0, 26.0, 13.0, 10.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.875, -21.2265625, -20.578125, -19.9296875, -19.28125, -18.6328125, -17.984375, -17.3359375, -16.6875, -16.0390625, -15.390625, -14.7421875, -14.09375, -13.4453125, -12.796875, -12.1484375, -11.5, -10.8515625, -10.203125, -9.5546875, -8.90625, -8.2578125, -7.609375, -6.9609375, -6.3125, -5.6640625, -5.015625, -4.3671875, -3.71875, -3.0703125, -2.421875, -1.7734375, -1.125, -0.4765625, 0.171875, 0.8203125, 1.46875, 2.1171875, 2.765625, 3.4140625, 4.0625, 4.7109375, 5.359375, 6.0078125, 6.65625, 7.3046875, 7.953125, 8.6015625, 9.25, 9.8984375, 10.546875, 11.1953125, 11.84375, 12.4921875, 13.140625, 13.7890625, 14.4375, 15.0859375, 15.734375, 16.3828125, 17.03125, 17.6796875, 18.328125, 18.9765625, 19.625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 10.0, 5.0, 15.0, 15.0, 23.0, 24.0, 37.0, 45.0, 70.0, 59.0, 82.0, 96.0, 123.0, 144.0, 150.0, 157.0, 178.0, 201.0, 216.0, 257.0, 218.0, 238.0, 226.0, 212.0, 204.0, 196.0, 139.0, 123.0, 131.0, 91.0, 81.0, 72.0, 50.0, 42.0, 39.0, 33.0, 25.0, 13.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.71875, -8.4659423828125, -8.213134765625, -7.9603271484375, -7.70751953125, -7.4547119140625, -7.201904296875, -6.9490966796875, -6.6962890625, -6.4434814453125, -6.190673828125, -5.9378662109375, -5.68505859375, -5.4322509765625, -5.179443359375, -4.9266357421875, -4.673828125, -4.4210205078125, -4.168212890625, -3.9154052734375, -3.66259765625, -3.4097900390625, -3.156982421875, -2.9041748046875, -2.6513671875, -2.3985595703125, -2.145751953125, -1.8929443359375, -1.64013671875, -1.3873291015625, -1.134521484375, -0.8817138671875, -0.62890625, -0.3760986328125, -0.123291015625, 0.1295166015625, 0.38232421875, 0.6351318359375, 0.887939453125, 1.1407470703125, 1.3935546875, 1.6463623046875, 1.899169921875, 2.1519775390625, 2.40478515625, 2.6575927734375, 2.910400390625, 3.1632080078125, 3.416015625, 3.6688232421875, 3.921630859375, 4.1744384765625, 4.42724609375, 4.6800537109375, 4.932861328125, 5.1856689453125, 5.4384765625, 5.6912841796875, 5.944091796875, 6.1968994140625, 6.44970703125, 6.7025146484375, 6.955322265625, 7.2081298828125, 7.4609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 4.0, 10.0, 12.0, 9.0, 9.0, 11.0, 14.0, 17.0, 20.0, 22.0, 23.0, 22.0, 43.0, 38.0, 35.0, 36.0, 38.0, 56.0, 46.0, 38.0, 43.0, 30.0, 29.0, 37.0, 37.0, 37.0, 31.0, 32.0, 38.0, 28.0, 26.0, 22.0, 22.0, 13.0, 10.0, 11.0, 7.0, 10.0, 9.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.29783821105957, -19.682409286499023, -19.06698226928711, -18.451553344726562, -17.836124420166016, -17.22069549560547, -16.605266571044922, -15.989839553833008, -15.374410629272461, -14.758981704711914, -14.143553733825684, -13.528125762939453, -12.912696838378906, -12.29726791381836, -11.681839942932129, -11.066411972045898, -10.450983047485352, -9.835554122924805, -9.220126152038574, -8.604698181152344, -7.989269256591797, -7.373840808868408, -6.7584123611450195, -6.142983913421631, -5.527555465698242, -4.9121270179748535, -4.296698570251465, -3.681270122528076, -3.0658416748046875, -2.450413227081299, -1.8349847793579102, -1.2195563316345215, -0.6041259765625, 0.011302471160888672, 0.6267309188842773, 1.242159366607666, 1.8575878143310547, 2.4730162620544434, 3.088444709777832, 3.7038731575012207, 4.319301605224609, 4.934730052947998, 5.550158500671387, 6.165586948394775, 6.781015396118164, 7.396443843841553, 8.011872291564941, 8.627300262451172, 9.242729187011719, 9.858158111572266, 10.473586082458496, 11.089014053344727, 11.704442977905273, 12.31987190246582, 12.93529987335205, 13.550727844238281, 14.166156768798828, 14.781585693359375, 15.397013664245605, 16.012441635131836, 16.627870559692383, 17.24329948425293, 17.858726501464844, 18.47415542602539, 19.089584350585938]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 7.0, 3.0, 2.0, 9.0, 11.0, 12.0, 18.0, 15.0, 14.0, 16.0, 23.0, 23.0, 26.0, 28.0, 30.0, 23.0, 26.0, 36.0, 37.0, 53.0, 49.0, 43.0, 32.0, 29.0, 40.0, 32.0, 34.0, 39.0, 25.0, 29.0, 32.0, 28.0, 27.0, 22.0, 21.0, 9.0, 15.0, 10.0, 9.0, 14.0, 14.0, 8.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.31538200378418, -17.731037139892578, -17.146692276000977, -16.562347412109375, -15.97800350189209, -15.393658638000488, -14.809314727783203, -14.224969863891602, -13.640625, -13.056280136108398, -12.471935272216797, -11.887591361999512, -11.30324649810791, -10.718901634216309, -10.134557723999023, -9.550212860107422, -8.96586799621582, -8.381523132324219, -7.797178745269775, -7.212834358215332, -6.6284894943237305, -6.044144630432129, -5.4598002433776855, -4.875455856323242, -4.291110992431641, -3.706766366958618, -3.1224217414855957, -2.5380771160125732, -1.9537324905395508, -1.3693878650665283, -0.7850432395935059, -0.2006988525390625, 0.3836479187011719, 0.9679925441741943, 1.5523371696472168, 2.1366817951202393, 2.7210264205932617, 3.305371046066284, 3.8897156715393066, 4.47406005859375, 5.058404922485352, 5.642749786376953, 6.2270941734313965, 6.81143856048584, 7.395783424377441, 7.980128288269043, 8.564472198486328, 9.14881706237793, 9.733161926269531, 10.317506790161133, 10.901851654052734, 11.48619556427002, 12.070540428161621, 12.654885292053223, 13.239229202270508, 13.82357406616211, 14.407918930053711, 14.992263793945312, 15.576608657836914, 16.160953521728516, 16.745296478271484, 17.329641342163086, 17.913986206054688, 18.49833106994629, 19.08267593383789]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 11.0, 24.0, 32.0, 51.0, 90.0, 129.0, 223.0, 301.0, 508.0, 863.0, 1525.0, 2671.0, 4689.0, 8256.0, 14678.0, 25957.0, 44806.0, 74717.0, 114477.0, 152410.0, 167564.0, 150147.0, 111159.0, 72111.0, 43289.0, 25124.0, 14040.0, 7967.0, 4556.0, 2508.0, 1445.0, 884.0, 545.0, 294.0, 203.0, 106.0, 83.0, 40.0, 20.0, 18.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.953125, -17.400146484375, -16.84716796875, -16.294189453125, -15.7412109375, -15.188232421875, -14.63525390625, -14.082275390625, -13.529296875, -12.976318359375, -12.42333984375, -11.870361328125, -11.3173828125, -10.764404296875, -10.21142578125, -9.658447265625, -9.10546875, -8.552490234375, -7.99951171875, -7.446533203125, -6.8935546875, -6.340576171875, -5.78759765625, -5.234619140625, -4.681640625, -4.128662109375, -3.57568359375, -3.022705078125, -2.4697265625, -1.916748046875, -1.36376953125, -0.810791015625, -0.2578125, 0.295166015625, 0.84814453125, 1.401123046875, 1.9541015625, 2.507080078125, 3.06005859375, 3.613037109375, 4.166015625, 4.718994140625, 5.27197265625, 5.824951171875, 6.3779296875, 6.930908203125, 7.48388671875, 8.036865234375, 8.58984375, 9.142822265625, 9.69580078125, 10.248779296875, 10.8017578125, 11.354736328125, 11.90771484375, 12.460693359375, 13.013671875, 13.566650390625, 14.11962890625, 14.672607421875, 15.2255859375, 15.778564453125, 16.33154296875, 16.884521484375, 17.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 6.0, 17.0, 16.0, 17.0, 21.0, 14.0, 22.0, 24.0, 29.0, 34.0, 32.0, 28.0, 37.0, 35.0, 35.0, 27.0, 40.0, 40.0, 44.0, 43.0, 34.0, 36.0, 35.0, 32.0, 41.0, 32.0, 25.0, 19.0, 23.0, 16.0, 27.0, 17.0, 13.0, 8.0, 15.0, 4.0, 5.0, 12.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.8125, -19.20849609375, -18.6044921875, -18.00048828125, -17.396484375, -16.79248046875, -16.1884765625, -15.58447265625, -14.98046875, -14.37646484375, -13.7724609375, -13.16845703125, -12.564453125, -11.96044921875, -11.3564453125, -10.75244140625, -10.1484375, -9.54443359375, -8.9404296875, -8.33642578125, -7.732421875, -7.12841796875, -6.5244140625, -5.92041015625, -5.31640625, -4.71240234375, -4.1083984375, -3.50439453125, -2.900390625, -2.29638671875, -1.6923828125, -1.08837890625, -0.484375, 0.11962890625, 0.7236328125, 1.32763671875, 1.931640625, 2.53564453125, 3.1396484375, 3.74365234375, 4.34765625, 4.95166015625, 5.5556640625, 6.15966796875, 6.763671875, 7.36767578125, 7.9716796875, 8.57568359375, 9.1796875, 9.78369140625, 10.3876953125, 10.99169921875, 11.595703125, 12.19970703125, 12.8037109375, 13.40771484375, 14.01171875, 14.61572265625, 15.2197265625, 15.82373046875, 16.427734375, 17.03173828125, 17.6357421875, 18.23974609375, 18.84375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 6.0, 16.0, 30.0, 27.0, 49.0, 65.0, 101.0, 145.0, 244.0, 361.0, 502.0, 765.0, 1172.0, 1827.0, 2957.0, 4943.0, 8407.0, 14994.0, 27279.0, 51419.0, 96055.0, 164995.0, 219600.0, 191173.0, 118531.0, 64575.0, 34017.0, 18428.0, 10333.0, 5896.0, 3448.0, 2178.0, 1337.0, 898.0, 622.0, 387.0, 261.0, 174.0, 116.0, 75.0, 58.0, 35.0, 23.0, 9.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.5, -23.701416015625, -22.90283203125, -22.104248046875, -21.3056640625, -20.507080078125, -19.70849609375, -18.909912109375, -18.111328125, -17.312744140625, -16.51416015625, -15.715576171875, -14.9169921875, -14.118408203125, -13.31982421875, -12.521240234375, -11.72265625, -10.924072265625, -10.12548828125, -9.326904296875, -8.5283203125, -7.729736328125, -6.93115234375, -6.132568359375, -5.333984375, -4.535400390625, -3.73681640625, -2.938232421875, -2.1396484375, -1.341064453125, -0.54248046875, 0.256103515625, 1.0546875, 1.853271484375, 2.65185546875, 3.450439453125, 4.2490234375, 5.047607421875, 5.84619140625, 6.644775390625, 7.443359375, 8.241943359375, 9.04052734375, 9.839111328125, 10.6376953125, 11.436279296875, 12.23486328125, 13.033447265625, 13.83203125, 14.630615234375, 15.42919921875, 16.227783203125, 17.0263671875, 17.824951171875, 18.62353515625, 19.422119140625, 20.220703125, 21.019287109375, 21.81787109375, 22.616455078125, 23.4150390625, 24.213623046875, 25.01220703125, 25.810791015625, 26.609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 9.0, 8.0, 9.0, 8.0, 12.0, 11.0, 12.0, 11.0, 28.0, 22.0, 24.0, 32.0, 43.0, 31.0, 29.0, 30.0, 41.0, 35.0, 40.0, 42.0, 47.0, 37.0, 32.0, 40.0, 34.0, 27.0, 29.0, 25.0, 30.0, 28.0, 23.0, 22.0, 24.0, 24.0, 20.0, 16.0, 11.0, 14.0, 9.0, 9.0, 4.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-13.671875, -13.2803955078125, -12.888916015625, -12.4974365234375, -12.10595703125, -11.7144775390625, -11.322998046875, -10.9315185546875, -10.5400390625, -10.1485595703125, -9.757080078125, -9.3656005859375, -8.97412109375, -8.5826416015625, -8.191162109375, -7.7996826171875, -7.408203125, -7.0167236328125, -6.625244140625, -6.2337646484375, -5.84228515625, -5.4508056640625, -5.059326171875, -4.6678466796875, -4.2763671875, -3.8848876953125, -3.493408203125, -3.1019287109375, -2.71044921875, -2.3189697265625, -1.927490234375, -1.5360107421875, -1.14453125, -0.7530517578125, -0.361572265625, 0.0299072265625, 0.42138671875, 0.8128662109375, 1.204345703125, 1.5958251953125, 1.9873046875, 2.3787841796875, 2.770263671875, 3.1617431640625, 3.55322265625, 3.9447021484375, 4.336181640625, 4.7276611328125, 5.119140625, 5.5106201171875, 5.902099609375, 6.2935791015625, 6.68505859375, 7.0765380859375, 7.468017578125, 7.8594970703125, 8.2509765625, 8.6424560546875, 9.033935546875, 9.4254150390625, 9.81689453125, 10.2083740234375, 10.599853515625, 10.9913330078125, 11.3828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 11.0, 11.0, 14.0, 15.0, 15.0, 19.0, 35.0, 36.0, 60.0, 98.0, 130.0, 183.0, 300.0, 448.0, 789.0, 1266.0, 2399.0, 4583.0, 9584.0, 21539.0, 50672.0, 118650.0, 234241.0, 280066.0, 177611.0, 81607.0, 34651.0, 14770.0, 6915.0, 3404.0, 1769.0, 917.0, 564.0, 368.0, 221.0, 140.0, 124.0, 80.0, 61.0, 53.0, 35.0, 22.0, 17.0, 13.0, 10.0, 13.0, 9.0, 8.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.671875, -12.239013671875, -11.80615234375, -11.373291015625, -10.9404296875, -10.507568359375, -10.07470703125, -9.641845703125, -9.208984375, -8.776123046875, -8.34326171875, -7.910400390625, -7.4775390625, -7.044677734375, -6.61181640625, -6.178955078125, -5.74609375, -5.313232421875, -4.88037109375, -4.447509765625, -4.0146484375, -3.581787109375, -3.14892578125, -2.716064453125, -2.283203125, -1.850341796875, -1.41748046875, -0.984619140625, -0.5517578125, -0.118896484375, 0.31396484375, 0.746826171875, 1.1796875, 1.612548828125, 2.04541015625, 2.478271484375, 2.9111328125, 3.343994140625, 3.77685546875, 4.209716796875, 4.642578125, 5.075439453125, 5.50830078125, 5.941162109375, 6.3740234375, 6.806884765625, 7.23974609375, 7.672607421875, 8.10546875, 8.538330078125, 8.97119140625, 9.404052734375, 9.8369140625, 10.269775390625, 10.70263671875, 11.135498046875, 11.568359375, 12.001220703125, 12.43408203125, 12.866943359375, 13.2998046875, 13.732666015625, 14.16552734375, 14.598388671875, 15.03125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 12.0, 17.0, 23.0, 25.0, 45.0, 67.0, 70.0, 91.0, 110.0, 99.0, 98.0, 97.0, 69.0, 47.0, 36.0, 25.0, 27.0, 7.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0014801025390625, -0.0014474540948867798, -0.0014148056507110596, -0.0013821572065353394, -0.0013495087623596191, -0.001316860318183899, -0.0012842118740081787, -0.0012515634298324585, -0.0012189149856567383, -0.001186266541481018, -0.0011536180973052979, -0.0011209696531295776, -0.0010883212089538574, -0.0010556727647781372, -0.001023024320602417, -0.0009903758764266968, -0.0009577274322509766, -0.0009250789880752563, -0.0008924305438995361, -0.0008597820997238159, -0.0008271336555480957, -0.0007944852113723755, -0.0007618367671966553, -0.0007291883230209351, -0.0006965398788452148, -0.0006638914346694946, -0.0006312429904937744, -0.0005985945463180542, -0.000565946102142334, -0.0005332976579666138, -0.0005006492137908936, -0.00046800076961517334, -0.0004353523254394531, -0.0004027038812637329, -0.0003700554370880127, -0.0003374069929122925, -0.00030475854873657227, -0.00027211010456085205, -0.00023946166038513184, -0.00020681321620941162, -0.0001741647720336914, -0.0001415163278579712, -0.00010886788368225098, -7.621943950653076e-05, -4.357099533081055e-05, -1.0922551155090332e-05, 2.1725893020629883e-05, 5.43743371963501e-05, 8.702278137207031e-05, 0.00011967122554779053, 0.00015231966972351074, 0.00018496811389923096, 0.00021761655807495117, 0.0002502650022506714, 0.0002829134464263916, 0.0003155618906021118, 0.00034821033477783203, 0.00038085877895355225, 0.00041350722312927246, 0.0004461556673049927, 0.0004788041114807129, 0.0005114525556564331, 0.0005441009998321533, 0.0005767494440078735, 0.0006093978881835938]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 20.0, 28.0, 27.0, 40.0, 60.0, 75.0, 138.0, 238.0, 364.0, 543.0, 1009.0, 1716.0, 3012.0, 5486.0, 10271.0, 19542.0, 37078.0, 68026.0, 114821.0, 165041.0, 188782.0, 166105.0, 116008.0, 68772.0, 37992.0, 19718.0, 10542.0, 5534.0, 3084.0, 1743.0, 1013.0, 618.0, 374.0, 242.0, 137.0, 106.0, 72.0, 53.0, 35.0, 21.0, 17.0, 14.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-12.109375, -11.748046875, -11.38671875, -11.025390625, -10.6640625, -10.302734375, -9.94140625, -9.580078125, -9.21875, -8.857421875, -8.49609375, -8.134765625, -7.7734375, -7.412109375, -7.05078125, -6.689453125, -6.328125, -5.966796875, -5.60546875, -5.244140625, -4.8828125, -4.521484375, -4.16015625, -3.798828125, -3.4375, -3.076171875, -2.71484375, -2.353515625, -1.9921875, -1.630859375, -1.26953125, -0.908203125, -0.546875, -0.185546875, 0.17578125, 0.537109375, 0.8984375, 1.259765625, 1.62109375, 1.982421875, 2.34375, 2.705078125, 3.06640625, 3.427734375, 3.7890625, 4.150390625, 4.51171875, 4.873046875, 5.234375, 5.595703125, 5.95703125, 6.318359375, 6.6796875, 7.041015625, 7.40234375, 7.763671875, 8.125, 8.486328125, 8.84765625, 9.208984375, 9.5703125, 9.931640625, 10.29296875, 10.654296875, 11.015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 7.0, 6.0, 7.0, 4.0, 14.0, 10.0, 15.0, 20.0, 23.0, 18.0, 30.0, 31.0, 36.0, 44.0, 42.0, 39.0, 60.0, 56.0, 50.0, 29.0, 42.0, 47.0, 47.0, 34.0, 42.0, 29.0, 30.0, 31.0, 29.0, 26.0, 19.0, 15.0, 11.0, 14.0, 12.0, 4.0, 2.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.375, -3.2701416015625, -3.165283203125, -3.0604248046875, -2.95556640625, -2.8507080078125, -2.745849609375, -2.6409912109375, -2.5361328125, -2.4312744140625, -2.326416015625, -2.2215576171875, -2.11669921875, -2.0118408203125, -1.906982421875, -1.8021240234375, -1.697265625, -1.5924072265625, -1.487548828125, -1.3826904296875, -1.27783203125, -1.1729736328125, -1.068115234375, -0.9632568359375, -0.8583984375, -0.7535400390625, -0.648681640625, -0.5438232421875, -0.43896484375, -0.3341064453125, -0.229248046875, -0.1243896484375, -0.01953125, 0.0853271484375, 0.190185546875, 0.2950439453125, 0.39990234375, 0.5047607421875, 0.609619140625, 0.7144775390625, 0.8193359375, 0.9241943359375, 1.029052734375, 1.1339111328125, 1.23876953125, 1.3436279296875, 1.448486328125, 1.5533447265625, 1.658203125, 1.7630615234375, 1.867919921875, 1.9727783203125, 2.07763671875, 2.1824951171875, 2.287353515625, 2.3922119140625, 2.4970703125, 2.6019287109375, 2.706787109375, 2.8116455078125, 2.91650390625, 3.0213623046875, 3.126220703125, 3.2310791015625, 3.3359375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 6.0, 4.0, 3.0, 13.0, 16.0, 19.0, 17.0, 16.0, 27.0, 21.0, 34.0, 30.0, 32.0, 30.0, 32.0, 39.0, 40.0, 43.0, 52.0, 33.0, 37.0, 39.0, 36.0, 35.0, 41.0, 35.0, 28.0, 30.0, 28.0, 23.0, 21.0, 24.0, 20.0, 17.0, 10.0, 15.0, 5.0, 5.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-19.37145233154297, -18.785348892211914, -18.199243545532227, -17.613140106201172, -17.027034759521484, -16.44093132019043, -15.854826927185059, -15.268722534179688, -14.682618141174316, -14.096513748168945, -13.510409355163574, -12.924304962158203, -12.338201522827148, -11.752096176147461, -11.165992736816406, -10.579888343811035, -9.993783950805664, -9.407679557800293, -8.821575164794922, -8.23547077178955, -7.649366855621338, -7.063262462615967, -6.477158546447754, -5.891054153442383, -5.304949760437012, -4.718845367431641, -4.1327409744262695, -3.5466370582580566, -2.9605326652526855, -2.3744282722473145, -1.7883241176605225, -1.2022199630737305, -0.6161174774169922, -0.030013203620910645, 0.5560910701751709, 1.1421953439712524, 1.728299617767334, 2.314404010772705, 2.900508165359497, 3.486612319946289, 4.07271671295166, 4.658821105957031, 5.244925498962402, 5.831029415130615, 6.417133808135986, 7.003238201141357, 7.58934211730957, 8.175446510314941, 8.761550903320312, 9.347655296325684, 9.933759689331055, 10.519864082336426, 11.105968475341797, 11.692071914672852, 12.278176307678223, 12.864280700683594, 13.450385093688965, 14.036489486694336, 14.622593879699707, 15.208698272705078, 15.794801712036133, 16.38090705871582, 16.967010498046875, 17.553115844726562, 18.139219284057617]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 11.0, 14.0, 13.0, 17.0, 13.0, 22.0, 23.0, 15.0, 25.0, 31.0, 25.0, 29.0, 31.0, 39.0, 43.0, 54.0, 39.0, 43.0, 34.0, 33.0, 40.0, 38.0, 34.0, 38.0, 26.0, 36.0, 30.0, 18.0, 31.0, 24.0, 17.0, 10.0, 15.0, 13.0, 8.0, 15.0, 11.0, 6.0, 4.0, 4.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.518085479736328, -17.92317771911621, -17.32826805114746, -16.733360290527344, -16.138450622558594, -15.543542861938477, -14.948634147644043, -14.35372543334961, -13.758816719055176, -13.163908004760742, -12.568999290466309, -11.974090576171875, -11.379182815551758, -10.784273147583008, -10.18936538696289, -9.594456672668457, -8.999547958374023, -8.40463924407959, -7.809730529785156, -7.214822292327881, -6.619913578033447, -6.025004863739014, -5.430096626281738, -4.835187911987305, -4.240279197692871, -3.6453704833984375, -3.050462007522583, -2.4555535316467285, -1.860644817352295, -1.2657361030578613, -0.6708276271820068, -0.07591915130615234, 0.5189895629882812, 1.1138981580734253, 1.7088067531585693, 2.303715229034424, 2.8986239433288574, 3.493532657623291, 4.088440895080566, 4.683349609375, 5.278258323669434, 5.873167037963867, 6.468075752258301, 7.062983989715576, 7.65789270401001, 8.252801895141602, 8.847709655761719, 9.442618370056152, 10.037527084350586, 10.63243579864502, 11.227344512939453, 11.822253227233887, 12.41716194152832, 13.012069702148438, 13.606978416442871, 14.201887130737305, 14.796795845031738, 15.391704559326172, 15.986613273620605, 16.58152198791504, 17.176429748535156, 17.771339416503906, 18.366247177124023, 18.96115493774414, 19.55606460571289]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 9.0, 9.0, 5.0, 7.0, 18.0, 37.0, 58.0, 93.0, 154.0, 250.0, 359.0, 622.0, 896.0, 1452.0, 2230.0, 3558.0, 5665.0, 8499.0, 12962.0, 18995.0, 27319.0, 37657.0, 50852.0, 65358.0, 79088.0, 91487.0, 98748.0, 100022.0, 94893.0, 84147.0, 70648.0, 55604.0, 42006.0, 30569.0, 21305.0, 15006.0, 9967.0, 6336.0, 4236.0, 2733.0, 1697.0, 1104.0, 698.0, 443.0, 283.0, 180.0, 118.0, 76.0, 46.0, 33.0, 14.0, 5.0, 2.0, 3.0, 3.0, 3.0], "bins": [-12.890625, -12.524169921875, -12.15771484375, -11.791259765625, -11.4248046875, -11.058349609375, -10.69189453125, -10.325439453125, -9.958984375, -9.592529296875, -9.22607421875, -8.859619140625, -8.4931640625, -8.126708984375, -7.76025390625, -7.393798828125, -7.02734375, -6.660888671875, -6.29443359375, -5.927978515625, -5.5615234375, -5.195068359375, -4.82861328125, -4.462158203125, -4.095703125, -3.729248046875, -3.36279296875, -2.996337890625, -2.6298828125, -2.263427734375, -1.89697265625, -1.530517578125, -1.1640625, -0.797607421875, -0.43115234375, -0.064697265625, 0.3017578125, 0.668212890625, 1.03466796875, 1.401123046875, 1.767578125, 2.134033203125, 2.50048828125, 2.866943359375, 3.2333984375, 3.599853515625, 3.96630859375, 4.332763671875, 4.69921875, 5.065673828125, 5.43212890625, 5.798583984375, 6.1650390625, 6.531494140625, 6.89794921875, 7.264404296875, 7.630859375, 7.997314453125, 8.36376953125, 8.730224609375, 9.0966796875, 9.463134765625, 9.82958984375, 10.196044921875, 10.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 13.0, 15.0, 17.0, 17.0, 14.0, 17.0, 21.0, 24.0, 21.0, 33.0, 35.0, 36.0, 32.0, 40.0, 41.0, 46.0, 43.0, 52.0, 43.0, 44.0, 27.0, 46.0, 46.0, 32.0, 35.0, 19.0, 25.0, 17.0, 22.0, 17.0, 16.0, 10.0, 17.0, 9.0, 4.0, 12.0, 2.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.15625, -20.51318359375, -19.8701171875, -19.22705078125, -18.583984375, -17.94091796875, -17.2978515625, -16.65478515625, -16.01171875, -15.36865234375, -14.7255859375, -14.08251953125, -13.439453125, -12.79638671875, -12.1533203125, -11.51025390625, -10.8671875, -10.22412109375, -9.5810546875, -8.93798828125, -8.294921875, -7.65185546875, -7.0087890625, -6.36572265625, -5.72265625, -5.07958984375, -4.4365234375, -3.79345703125, -3.150390625, -2.50732421875, -1.8642578125, -1.22119140625, -0.578125, 0.06494140625, 0.7080078125, 1.35107421875, 1.994140625, 2.63720703125, 3.2802734375, 3.92333984375, 4.56640625, 5.20947265625, 5.8525390625, 6.49560546875, 7.138671875, 7.78173828125, 8.4248046875, 9.06787109375, 9.7109375, 10.35400390625, 10.9970703125, 11.64013671875, 12.283203125, 12.92626953125, 13.5693359375, 14.21240234375, 14.85546875, 15.49853515625, 16.1416015625, 16.78466796875, 17.427734375, 18.07080078125, 18.7138671875, 19.35693359375, 20.0]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 8.0, 8.0, 12.0, 15.0, 29.0, 37.0, 77.0, 132.0, 179.0, 308.0, 478.0, 788.0, 1295.0, 2062.0, 3356.0, 5230.0, 8353.0, 13357.0, 20718.0, 30946.0, 45040.0, 62648.0, 82297.0, 100138.0, 112466.0, 115761.0, 109417.0, 92871.0, 73649.0, 55149.0, 38543.0, 26096.0, 17199.0, 11216.0, 6918.0, 4509.0, 2750.0, 1648.0, 1069.0, 673.0, 416.0, 265.0, 157.0, 99.0, 65.0, 52.0, 24.0, 22.0, 5.0, 4.0, 5.0, 3.0, 2.0], "bins": [-16.078125, -15.6351318359375, -15.192138671875, -14.7491455078125, -14.30615234375, -13.8631591796875, -13.420166015625, -12.9771728515625, -12.5341796875, -12.0911865234375, -11.648193359375, -11.2052001953125, -10.76220703125, -10.3192138671875, -9.876220703125, -9.4332275390625, -8.990234375, -8.5472412109375, -8.104248046875, -7.6612548828125, -7.21826171875, -6.7752685546875, -6.332275390625, -5.8892822265625, -5.4462890625, -5.0032958984375, -4.560302734375, -4.1173095703125, -3.67431640625, -3.2313232421875, -2.788330078125, -2.3453369140625, -1.90234375, -1.4593505859375, -1.016357421875, -0.5733642578125, -0.13037109375, 0.3126220703125, 0.755615234375, 1.1986083984375, 1.6416015625, 2.0845947265625, 2.527587890625, 2.9705810546875, 3.41357421875, 3.8565673828125, 4.299560546875, 4.7425537109375, 5.185546875, 5.6285400390625, 6.071533203125, 6.5145263671875, 6.95751953125, 7.4005126953125, 7.843505859375, 8.2864990234375, 8.7294921875, 9.1724853515625, 9.615478515625, 10.0584716796875, 10.50146484375, 10.9444580078125, 11.387451171875, 11.8304443359375, 12.2734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 9.0, 4.0, 8.0, 8.0, 12.0, 15.0, 15.0, 14.0, 22.0, 32.0, 19.0, 28.0, 30.0, 29.0, 33.0, 38.0, 44.0, 43.0, 35.0, 39.0, 40.0, 48.0, 33.0, 38.0, 35.0, 40.0, 25.0, 29.0, 33.0, 35.0, 29.0, 19.0, 19.0, 16.0, 18.0, 18.0, 11.0, 5.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0], "bins": [-14.40625, -13.9954833984375, -13.584716796875, -13.1739501953125, -12.76318359375, -12.3524169921875, -11.941650390625, -11.5308837890625, -11.1201171875, -10.7093505859375, -10.298583984375, -9.8878173828125, -9.47705078125, -9.0662841796875, -8.655517578125, -8.2447509765625, -7.833984375, -7.4232177734375, -7.012451171875, -6.6016845703125, -6.19091796875, -5.7801513671875, -5.369384765625, -4.9586181640625, -4.5478515625, -4.1370849609375, -3.726318359375, -3.3155517578125, -2.90478515625, -2.4940185546875, -2.083251953125, -1.6724853515625, -1.26171875, -0.8509521484375, -0.440185546875, -0.0294189453125, 0.38134765625, 0.7921142578125, 1.202880859375, 1.6136474609375, 2.0244140625, 2.4351806640625, 2.845947265625, 3.2567138671875, 3.66748046875, 4.0782470703125, 4.489013671875, 4.8997802734375, 5.310546875, 5.7213134765625, 6.132080078125, 6.5428466796875, 6.95361328125, 7.3643798828125, 7.775146484375, 8.1859130859375, 8.5966796875, 9.0074462890625, 9.418212890625, 9.8289794921875, 10.23974609375, 10.6505126953125, 11.061279296875, 11.4720458984375, 11.8828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 13.0, 18.0, 25.0, 31.0, 55.0, 81.0, 113.0, 213.0, 388.0, 615.0, 950.0, 1711.0, 3022.0, 5408.0, 9319.0, 16251.0, 28101.0, 46684.0, 72907.0, 104587.0, 132440.0, 147421.0, 140793.0, 116196.0, 84468.0, 55372.0, 34389.0, 20085.0, 11506.0, 6491.0, 3749.0, 2056.0, 1265.0, 720.0, 441.0, 240.0, 154.0, 92.0, 66.0, 38.0, 29.0, 22.0, 14.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.71484375, -6.49603271484375, -6.2772216796875, -6.05841064453125, -5.839599609375, -5.62078857421875, -5.4019775390625, -5.18316650390625, -4.96435546875, -4.74554443359375, -4.5267333984375, -4.30792236328125, -4.089111328125, -3.87030029296875, -3.6514892578125, -3.43267822265625, -3.2138671875, -2.99505615234375, -2.7762451171875, -2.55743408203125, -2.338623046875, -2.11981201171875, -1.9010009765625, -1.68218994140625, -1.46337890625, -1.24456787109375, -1.0257568359375, -0.80694580078125, -0.588134765625, -0.36932373046875, -0.1505126953125, 0.06829833984375, 0.287109375, 0.50592041015625, 0.7247314453125, 0.94354248046875, 1.162353515625, 1.38116455078125, 1.5999755859375, 1.81878662109375, 2.03759765625, 2.25640869140625, 2.4752197265625, 2.69403076171875, 2.912841796875, 3.13165283203125, 3.3504638671875, 3.56927490234375, 3.7880859375, 4.00689697265625, 4.2257080078125, 4.44451904296875, 4.663330078125, 4.88214111328125, 5.1009521484375, 5.31976318359375, 5.53857421875, 5.75738525390625, 5.9761962890625, 6.19500732421875, 6.413818359375, 6.63262939453125, 6.8514404296875, 7.07025146484375, 7.2890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 11.0, 12.0, 6.0, 9.0, 14.0, 14.0, 21.0, 20.0, 26.0, 21.0, 26.0, 46.0, 36.0, 38.0, 48.0, 34.0, 41.0, 44.0, 45.0, 44.0, 38.0, 45.0, 41.0, 35.0, 34.0, 45.0, 21.0, 29.0, 22.0, 25.0, 25.0, 12.0, 16.0, 13.0, 10.0, 6.0, 11.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007143020629882812, -0.0006935968995094299, -0.0006728917360305786, -0.0006521865725517273, -0.000631481409072876, -0.0006107762455940247, -0.0005900710821151733, -0.000569365918636322, -0.0005486607551574707, -0.0005279555916786194, -0.0005072504281997681, -0.00048654526472091675, -0.00046584010124206543, -0.0004451349377632141, -0.0004244297742843628, -0.0004037246108055115, -0.00038301944732666016, -0.00036231428384780884, -0.0003416091203689575, -0.0003209039568901062, -0.0003001987934112549, -0.00027949362993240356, -0.00025878846645355225, -0.00023808330297470093, -0.0002173781394958496, -0.0001966729760169983, -0.00017596781253814697, -0.00015526264905929565, -0.00013455748558044434, -0.00011385232210159302, -9.31471586227417e-05, -7.244199514389038e-05, -5.173683166503906e-05, -3.1031668186187744e-05, -1.0326504707336426e-05, 1.0378658771514893e-05, 3.108382225036621e-05, 5.178898572921753e-05, 7.249414920806885e-05, 9.319931268692017e-05, 0.00011390447616577148, 0.0001346096396446228, 0.00015531480312347412, 0.00017601996660232544, 0.00019672513008117676, 0.00021743029356002808, 0.0002381354570388794, 0.0002588406205177307, 0.00027954578399658203, 0.00030025094747543335, 0.00032095611095428467, 0.000341661274433136, 0.0003623664379119873, 0.0003830716013908386, 0.00040377676486968994, 0.00042448192834854126, 0.0004451870918273926, 0.0004658922553062439, 0.0004865974187850952, 0.0005073025822639465, 0.0005280077457427979, 0.0005487129092216492, 0.0005694180727005005, 0.0005901232361793518, 0.0006108283996582031]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 4.0, 9.0, 24.0, 26.0, 35.0, 72.0, 112.0, 144.0, 271.0, 460.0, 712.0, 1167.0, 1907.0, 3113.0, 5311.0, 8603.0, 13405.0, 21509.0, 33518.0, 49506.0, 69459.0, 92897.0, 111757.0, 122884.0, 121686.0, 108175.0, 88043.0, 65511.0, 46097.0, 30355.0, 19739.0, 12290.0, 7670.0, 4709.0, 2887.0, 1734.0, 1037.0, 662.0, 380.0, 270.0, 146.0, 102.0, 62.0, 24.0, 25.0, 23.0, 11.0, 8.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6953125, -5.510986328125, -5.32666015625, -5.142333984375, -4.9580078125, -4.773681640625, -4.58935546875, -4.405029296875, -4.220703125, -4.036376953125, -3.85205078125, -3.667724609375, -3.4833984375, -3.299072265625, -3.11474609375, -2.930419921875, -2.74609375, -2.561767578125, -2.37744140625, -2.193115234375, -2.0087890625, -1.824462890625, -1.64013671875, -1.455810546875, -1.271484375, -1.087158203125, -0.90283203125, -0.718505859375, -0.5341796875, -0.349853515625, -0.16552734375, 0.018798828125, 0.203125, 0.387451171875, 0.57177734375, 0.756103515625, 0.9404296875, 1.124755859375, 1.30908203125, 1.493408203125, 1.677734375, 1.862060546875, 2.04638671875, 2.230712890625, 2.4150390625, 2.599365234375, 2.78369140625, 2.968017578125, 3.15234375, 3.336669921875, 3.52099609375, 3.705322265625, 3.8896484375, 4.073974609375, 4.25830078125, 4.442626953125, 4.626953125, 4.811279296875, 4.99560546875, 5.179931640625, 5.3642578125, 5.548583984375, 5.73291015625, 5.917236328125, 6.1015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 4.0, 21.0, 17.0, 27.0, 15.0, 21.0, 36.0, 40.0, 44.0, 52.0, 50.0, 58.0, 57.0, 56.0, 70.0, 66.0, 46.0, 45.0, 40.0, 47.0, 26.0, 30.0, 26.0, 22.0, 16.0, 17.0, 9.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.810546875, -2.70953369140625, -2.6085205078125, -2.50750732421875, -2.406494140625, -2.30548095703125, -2.2044677734375, -2.10345458984375, -2.00244140625, -1.90142822265625, -1.8004150390625, -1.69940185546875, -1.598388671875, -1.49737548828125, -1.3963623046875, -1.29534912109375, -1.1943359375, -1.09332275390625, -0.9923095703125, -0.89129638671875, -0.790283203125, -0.68927001953125, -0.5882568359375, -0.48724365234375, -0.38623046875, -0.28521728515625, -0.1842041015625, -0.08319091796875, 0.017822265625, 0.11883544921875, 0.2198486328125, 0.32086181640625, 0.421875, 0.52288818359375, 0.6239013671875, 0.72491455078125, 0.825927734375, 0.92694091796875, 1.0279541015625, 1.12896728515625, 1.22998046875, 1.33099365234375, 1.4320068359375, 1.53302001953125, 1.634033203125, 1.73504638671875, 1.8360595703125, 1.93707275390625, 2.0380859375, 2.13909912109375, 2.2401123046875, 2.34112548828125, 2.442138671875, 2.54315185546875, 2.6441650390625, 2.74517822265625, 2.84619140625, 2.94720458984375, 3.0482177734375, 3.14923095703125, 3.250244140625, 3.35125732421875, 3.4522705078125, 3.55328369140625, 3.654296875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 7.0, 3.0, 10.0, 9.0, 11.0, 13.0, 15.0, 21.0, 21.0, 33.0, 30.0, 36.0, 46.0, 36.0, 41.0, 45.0, 44.0, 46.0, 46.0, 43.0, 42.0, 41.0, 40.0, 42.0, 35.0, 41.0, 27.0, 28.0, 27.0, 22.0, 20.0, 10.0, 17.0, 13.0, 7.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.684804916381836, -20.044353485107422, -19.40390396118164, -18.763452529907227, -18.123001098632812, -17.48255157470703, -16.842100143432617, -16.201648712158203, -15.561198234558105, -14.920747756958008, -14.280296325683594, -13.639845848083496, -12.999395370483398, -12.358943939208984, -11.718493461608887, -11.078042984008789, -10.437591552734375, -9.797141075134277, -9.156689643859863, -8.516239166259766, -7.87578821182251, -7.235337257385254, -6.594886779785156, -5.9544358253479, -5.3139848709106445, -4.673533916473389, -4.033082962036133, -3.392632484436035, -2.7521815299987793, -2.1117305755615234, -1.4712798595428467, -0.8308291435241699, -0.19037818908691406, 0.45007264614105225, 1.0905234813690186, 1.7309743165969849, 2.371425151824951, 3.011876106262207, 3.652326822280884, 4.2927775382995605, 4.933228492736816, 5.573679447174072, 6.214130401611328, 6.854580879211426, 7.495031833648682, 8.135482788085938, 8.775933265686035, 9.416383743286133, 10.056835174560547, 10.697285652160645, 11.337737083435059, 11.978187561035156, 12.61863899230957, 13.259089469909668, 13.899539947509766, 14.53999137878418, 15.180441856384277, 15.820892333984375, 16.46134376525879, 17.101795196533203, 17.742244720458984, 18.3826961517334, 19.023147583007812, 19.663597106933594, 20.304048538208008]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 6.0, 6.0, 1.0, 6.0, 2.0, 12.0, 7.0, 10.0, 4.0, 12.0, 12.0, 18.0, 27.0, 16.0, 23.0, 17.0, 36.0, 35.0, 27.0, 26.0, 24.0, 33.0, 32.0, 30.0, 35.0, 34.0, 39.0, 42.0, 36.0, 40.0, 34.0, 27.0, 22.0, 32.0, 25.0, 20.0, 21.0, 18.0, 23.0, 18.0, 24.0, 9.0, 11.0, 14.0, 13.0, 9.0, 4.0, 8.0, 12.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0], "bins": [-18.1922550201416, -17.644514083862305, -17.096773147583008, -16.549034118652344, -16.001293182373047, -15.45355224609375, -14.905811309814453, -14.358071327209473, -13.810331344604492, -13.262590408325195, -12.714850425720215, -12.167109489440918, -11.619369506835938, -11.07162857055664, -10.523887634277344, -9.976147651672363, -9.428406715393066, -8.88066577911377, -8.332925796508789, -7.785184860229492, -7.237444877624512, -6.689703941345215, -6.141963481903076, -5.5942230224609375, -5.046482563018799, -4.49874210357666, -3.9510016441345215, -3.4032609462738037, -2.855520486831665, -2.3077800273895264, -1.7600393295288086, -1.21229887008667, -0.6645584106445312, -0.1168178915977478, 0.43092262744903564, 0.9786632061004639, 1.5264036655426025, 2.074144124984741, 2.621884822845459, 3.1696252822875977, 3.7173657417297363, 4.265106201171875, 4.812846660614014, 5.360587120056152, 5.908328056335449, 6.45606803894043, 7.003808975219727, 7.551549434661865, 8.099289894104004, 8.6470308303833, 9.194770812988281, 9.742511749267578, 10.290251731872559, 10.837992668151855, 11.385732650756836, 11.933473587036133, 12.48121452331543, 13.028955459594727, 13.576695442199707, 14.124436378479004, 14.672176361083984, 15.219917297363281, 15.767658233642578, 16.315399169921875, 16.86313819885254]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 3.0, 7.0, 12.0, 21.0, 31.0, 42.0, 42.0, 75.0, 134.0, 176.0, 300.0, 454.0, 605.0, 1071.0, 1754.0, 2932.0, 4875.0, 8463.0, 14297.0, 24930.0, 44612.0, 81004.0, 146377.0, 257791.0, 424279.0, 608296.0, 709087.0, 654612.0, 488808.0, 310605.0, 179712.0, 100695.0, 55392.0, 30786.0, 17541.0, 10132.0, 5765.0, 3273.0, 2025.0, 1301.0, 694.0, 455.0, 277.0, 174.0, 130.0, 71.0, 49.0, 33.0, 22.0, 22.0, 14.0, 10.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.25, -15.702392578125, -15.15478515625, -14.607177734375, -14.0595703125, -13.511962890625, -12.96435546875, -12.416748046875, -11.869140625, -11.321533203125, -10.77392578125, -10.226318359375, -9.6787109375, -9.131103515625, -8.58349609375, -8.035888671875, -7.48828125, -6.940673828125, -6.39306640625, -5.845458984375, -5.2978515625, -4.750244140625, -4.20263671875, -3.655029296875, -3.107421875, -2.559814453125, -2.01220703125, -1.464599609375, -0.9169921875, -0.369384765625, 0.17822265625, 0.725830078125, 1.2734375, 1.821044921875, 2.36865234375, 2.916259765625, 3.4638671875, 4.011474609375, 4.55908203125, 5.106689453125, 5.654296875, 6.201904296875, 6.74951171875, 7.297119140625, 7.8447265625, 8.392333984375, 8.93994140625, 9.487548828125, 10.03515625, 10.582763671875, 11.13037109375, 11.677978515625, 12.2255859375, 12.773193359375, 13.32080078125, 13.868408203125, 14.416015625, 14.963623046875, 15.51123046875, 16.058837890625, 16.6064453125, 17.154052734375, 17.70166015625, 18.249267578125, 18.796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 4.0, 9.0, 6.0, 8.0, 6.0, 6.0, 10.0, 7.0, 15.0, 16.0, 9.0, 20.0, 18.0, 20.0, 27.0, 39.0, 24.0, 27.0, 31.0, 40.0, 30.0, 36.0, 33.0, 29.0, 39.0, 35.0, 37.0, 29.0, 39.0, 25.0, 29.0, 36.0, 21.0, 33.0, 23.0, 24.0, 14.0, 19.0, 16.0, 21.0, 11.0, 15.0, 9.0, 5.0, 15.0, 5.0, 5.0, 8.0, 1.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0], "bins": [-15.1796875, -14.712158203125, -14.24462890625, -13.777099609375, -13.3095703125, -12.842041015625, -12.37451171875, -11.906982421875, -11.439453125, -10.971923828125, -10.50439453125, -10.036865234375, -9.5693359375, -9.101806640625, -8.63427734375, -8.166748046875, -7.69921875, -7.231689453125, -6.76416015625, -6.296630859375, -5.8291015625, -5.361572265625, -4.89404296875, -4.426513671875, -3.958984375, -3.491455078125, -3.02392578125, -2.556396484375, -2.0888671875, -1.621337890625, -1.15380859375, -0.686279296875, -0.21875, 0.248779296875, 0.71630859375, 1.183837890625, 1.6513671875, 2.118896484375, 2.58642578125, 3.053955078125, 3.521484375, 3.989013671875, 4.45654296875, 4.924072265625, 5.3916015625, 5.859130859375, 6.32666015625, 6.794189453125, 7.26171875, 7.729248046875, 8.19677734375, 8.664306640625, 9.1318359375, 9.599365234375, 10.06689453125, 10.534423828125, 11.001953125, 11.469482421875, 11.93701171875, 12.404541015625, 12.8720703125, 13.339599609375, 13.80712890625, 14.274658203125, 14.7421875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 9.0, 6.0, 7.0, 19.0, 25.0, 25.0, 55.0, 77.0, 128.0, 208.0, 360.0, 526.0, 991.0, 1551.0, 2611.0, 4601.0, 8057.0, 13929.0, 24518.0, 42949.0, 75780.0, 130674.0, 219840.0, 351080.0, 510467.0, 638458.0, 652883.0, 541545.0, 384106.0, 244037.0, 146687.0, 84562.0, 48585.0, 27630.0, 15597.0, 8944.0, 5064.0, 3035.0, 1803.0, 1060.0, 675.0, 431.0, 279.0, 155.0, 101.0, 66.0, 35.0, 17.0, 12.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.52294921875, -16.9208984375, -16.31884765625, -15.716796875, -15.11474609375, -14.5126953125, -13.91064453125, -13.30859375, -12.70654296875, -12.1044921875, -11.50244140625, -10.900390625, -10.29833984375, -9.6962890625, -9.09423828125, -8.4921875, -7.89013671875, -7.2880859375, -6.68603515625, -6.083984375, -5.48193359375, -4.8798828125, -4.27783203125, -3.67578125, -3.07373046875, -2.4716796875, -1.86962890625, -1.267578125, -0.66552734375, -0.0634765625, 0.53857421875, 1.140625, 1.74267578125, 2.3447265625, 2.94677734375, 3.548828125, 4.15087890625, 4.7529296875, 5.35498046875, 5.95703125, 6.55908203125, 7.1611328125, 7.76318359375, 8.365234375, 8.96728515625, 9.5693359375, 10.17138671875, 10.7734375, 11.37548828125, 11.9775390625, 12.57958984375, 13.181640625, 13.78369140625, 14.3857421875, 14.98779296875, 15.58984375, 16.19189453125, 16.7939453125, 17.39599609375, 17.998046875, 18.60009765625, 19.2021484375, 19.80419921875, 20.40625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 8.0, 11.0, 22.0, 24.0, 25.0, 34.0, 28.0, 43.0, 54.0, 65.0, 82.0, 101.0, 126.0, 158.0, 159.0, 171.0, 199.0, 200.0, 212.0, 224.0, 229.0, 214.0, 221.0, 204.0, 189.0, 168.0, 172.0, 121.0, 120.0, 93.0, 78.0, 66.0, 61.0, 53.0, 30.0, 20.0, 22.0, 13.0, 14.0, 7.0, 6.0, 8.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.8046875, -7.56939697265625, -7.3341064453125, -7.09881591796875, -6.863525390625, -6.62823486328125, -6.3929443359375, -6.15765380859375, -5.92236328125, -5.68707275390625, -5.4517822265625, -5.21649169921875, -4.981201171875, -4.74591064453125, -4.5106201171875, -4.27532958984375, -4.0400390625, -3.80474853515625, -3.5694580078125, -3.33416748046875, -3.098876953125, -2.86358642578125, -2.6282958984375, -2.39300537109375, -2.15771484375, -1.92242431640625, -1.6871337890625, -1.45184326171875, -1.216552734375, -0.98126220703125, -0.7459716796875, -0.51068115234375, -0.275390625, -0.04010009765625, 0.1951904296875, 0.43048095703125, 0.665771484375, 0.90106201171875, 1.1363525390625, 1.37164306640625, 1.60693359375, 1.84222412109375, 2.0775146484375, 2.31280517578125, 2.548095703125, 2.78338623046875, 3.0186767578125, 3.25396728515625, 3.4892578125, 3.72454833984375, 3.9598388671875, 4.19512939453125, 4.430419921875, 4.66571044921875, 4.9010009765625, 5.13629150390625, 5.37158203125, 5.60687255859375, 5.8421630859375, 6.07745361328125, 6.312744140625, 6.54803466796875, 6.7833251953125, 7.01861572265625, 7.25390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 9.0, 12.0, 12.0, 16.0, 19.0, 27.0, 20.0, 31.0, 25.0, 41.0, 41.0, 34.0, 45.0, 35.0, 49.0, 48.0, 47.0, 45.0, 35.0, 38.0, 41.0, 42.0, 43.0, 34.0, 45.0, 22.0, 17.0, 21.0, 10.0, 12.0, 10.0, 11.0, 7.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.348783493041992, -18.72844123840332, -18.10809898376465, -17.487756729125977, -16.867414474487305, -16.247074127197266, -15.626730918884277, -15.006389617919922, -14.38604736328125, -13.765705108642578, -13.145362854003906, -12.525020599365234, -11.904679298400879, -11.284337043762207, -10.663994789123535, -10.04365348815918, -9.423310279846191, -8.80296802520752, -8.182625770568848, -7.562283992767334, -6.94194221496582, -6.321599960327148, -5.701257705688477, -5.080915927886963, -4.460573673248291, -3.8402316570281982, -3.2198896408081055, -2.5995473861694336, -1.9792053699493408, -1.358863353729248, -0.7385210990905762, -0.1181793212890625, 0.5021629333496094, 1.1225049495697021, 1.7428470849990845, 2.363189220428467, 2.9835312366485596, 3.6038732528686523, 4.224215507507324, 4.844557285308838, 5.46489953994751, 6.085241794586182, 6.705583572387695, 7.325925827026367, 7.946268081665039, 8.566610336303711, 9.186952590942383, 9.807293891906738, 10.42763614654541, 11.047978401184082, 11.668320655822754, 12.28866195678711, 12.909004211425781, 13.529346466064453, 14.149688720703125, 14.770030975341797, 15.390373229980469, 16.01071548461914, 16.631057739257812, 17.251399993896484, 17.871742248535156, 18.492084503173828, 19.1124267578125, 19.73276710510254, 20.35310935974121]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 9.0, 7.0, 10.0, 17.0, 14.0, 16.0, 21.0, 29.0, 22.0, 27.0, 18.0, 22.0, 39.0, 38.0, 34.0, 39.0, 28.0, 35.0, 45.0, 48.0, 29.0, 36.0, 37.0, 28.0, 32.0, 33.0, 29.0, 30.0, 25.0, 18.0, 25.0, 15.0, 25.0, 14.0, 13.0, 20.0, 13.0, 6.0, 8.0, 6.0, 12.0, 5.0, 2.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.243106842041016, -17.684803009033203, -17.126497268676758, -16.568193435668945, -16.0098876953125, -15.451583862304688, -14.893280029296875, -14.334975242614746, -13.776670455932617, -13.218365669250488, -12.66006088256836, -12.101757049560547, -11.543452262878418, -10.985147476196289, -10.426843643188477, -9.868538856506348, -9.310234069824219, -8.75192928314209, -8.193624496459961, -7.635320663452148, -7.0770158767700195, -6.518711090087891, -5.96040678024292, -5.402102470397949, -4.84379768371582, -4.285492897033691, -3.7271885871887207, -3.168884038925171, -2.610579490661621, -2.0522749423980713, -1.4939703941345215, -0.9356658458709717, -0.3773632049560547, 0.18094134330749512, 0.7392458915710449, 1.2975504398345947, 1.8558549880981445, 2.4141595363616943, 2.972464084625244, 3.530768632888794, 4.089073181152344, 4.647377967834473, 5.205682277679443, 5.763986587524414, 6.322291374206543, 6.880596160888672, 7.438900470733643, 7.997204780578613, 8.555509567260742, 9.113814353942871, 9.672119140625, 10.230422973632812, 10.788727760314941, 11.34703254699707, 11.905336380004883, 12.463641166687012, 13.02194595336914, 13.58025074005127, 14.138555526733398, 14.696859359741211, 15.25516414642334, 15.813468933105469, 16.37177276611328, 16.930078506469727, 17.48838233947754]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 7.0, 6.0, 8.0, 10.0, 25.0, 36.0, 52.0, 78.0, 120.0, 215.0, 270.0, 399.0, 644.0, 992.0, 1527.0, 2510.0, 3855.0, 6334.0, 9978.0, 15828.0, 24411.0, 36783.0, 54774.0, 76475.0, 99715.0, 119583.0, 126929.0, 120479.0, 102054.0, 78598.0, 56756.0, 38787.0, 25580.0, 16264.0, 10288.0, 6728.0, 4170.0, 2596.0, 1665.0, 1054.0, 663.0, 434.0, 303.0, 198.0, 130.0, 84.0, 63.0, 42.0, 26.0, 14.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.0390625, -9.6993408203125, -9.359619140625, -9.0198974609375, -8.68017578125, -8.3404541015625, -8.000732421875, -7.6610107421875, -7.3212890625, -6.9815673828125, -6.641845703125, -6.3021240234375, -5.96240234375, -5.6226806640625, -5.282958984375, -4.9432373046875, -4.603515625, -4.2637939453125, -3.924072265625, -3.5843505859375, -3.24462890625, -2.9049072265625, -2.565185546875, -2.2254638671875, -1.8857421875, -1.5460205078125, -1.206298828125, -0.8665771484375, -0.52685546875, -0.1871337890625, 0.152587890625, 0.4923095703125, 0.83203125, 1.1717529296875, 1.511474609375, 1.8511962890625, 2.19091796875, 2.5306396484375, 2.870361328125, 3.2100830078125, 3.5498046875, 3.8895263671875, 4.229248046875, 4.5689697265625, 4.90869140625, 5.2484130859375, 5.588134765625, 5.9278564453125, 6.267578125, 6.6072998046875, 6.947021484375, 7.2867431640625, 7.62646484375, 7.9661865234375, 8.305908203125, 8.6456298828125, 8.9853515625, 9.3250732421875, 9.664794921875, 10.0045166015625, 10.34423828125, 10.6839599609375, 11.023681640625, 11.3634033203125, 11.703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 12.0, 4.0, 6.0, 9.0, 19.0, 22.0, 19.0, 16.0, 29.0, 27.0, 24.0, 30.0, 36.0, 34.0, 38.0, 40.0, 29.0, 41.0, 32.0, 44.0, 38.0, 41.0, 35.0, 32.0, 24.0, 26.0, 31.0, 28.0, 27.0, 21.0, 25.0, 16.0, 22.0, 12.0, 18.0, 14.0, 16.0, 11.0, 12.0, 6.0, 11.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-19.046875, -18.4677734375, -17.888671875, -17.3095703125, -16.73046875, -16.1513671875, -15.572265625, -14.9931640625, -14.4140625, -13.8349609375, -13.255859375, -12.6767578125, -12.09765625, -11.5185546875, -10.939453125, -10.3603515625, -9.78125, -9.2021484375, -8.623046875, -8.0439453125, -7.46484375, -6.8857421875, -6.306640625, -5.7275390625, -5.1484375, -4.5693359375, -3.990234375, -3.4111328125, -2.83203125, -2.2529296875, -1.673828125, -1.0947265625, -0.515625, 0.0634765625, 0.642578125, 1.2216796875, 1.80078125, 2.3798828125, 2.958984375, 3.5380859375, 4.1171875, 4.6962890625, 5.275390625, 5.8544921875, 6.43359375, 7.0126953125, 7.591796875, 8.1708984375, 8.75, 9.3291015625, 9.908203125, 10.4873046875, 11.06640625, 11.6455078125, 12.224609375, 12.8037109375, 13.3828125, 13.9619140625, 14.541015625, 15.1201171875, 15.69921875, 16.2783203125, 16.857421875, 17.4365234375, 18.015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 8.0, 19.0, 24.0, 38.0, 55.0, 68.0, 98.0, 163.0, 270.0, 380.0, 652.0, 1200.0, 1896.0, 3379.0, 6312.0, 11527.0, 21728.0, 41422.0, 77417.0, 135917.0, 199172.0, 207410.0, 150265.0, 87673.0, 47248.0, 24755.0, 12941.0, 7103.0, 3864.0, 2234.0, 1253.0, 768.0, 473.0, 274.0, 179.0, 139.0, 73.0, 46.0, 40.0, 20.0, 19.0, 6.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-22.40625, -21.749267578125, -21.09228515625, -20.435302734375, -19.7783203125, -19.121337890625, -18.46435546875, -17.807373046875, -17.150390625, -16.493408203125, -15.83642578125, -15.179443359375, -14.5224609375, -13.865478515625, -13.20849609375, -12.551513671875, -11.89453125, -11.237548828125, -10.58056640625, -9.923583984375, -9.2666015625, -8.609619140625, -7.95263671875, -7.295654296875, -6.638671875, -5.981689453125, -5.32470703125, -4.667724609375, -4.0107421875, -3.353759765625, -2.69677734375, -2.039794921875, -1.3828125, -0.725830078125, -0.06884765625, 0.588134765625, 1.2451171875, 1.902099609375, 2.55908203125, 3.216064453125, 3.873046875, 4.530029296875, 5.18701171875, 5.843994140625, 6.5009765625, 7.157958984375, 7.81494140625, 8.471923828125, 9.12890625, 9.785888671875, 10.44287109375, 11.099853515625, 11.7568359375, 12.413818359375, 13.07080078125, 13.727783203125, 14.384765625, 15.041748046875, 15.69873046875, 16.355712890625, 17.0126953125, 17.669677734375, 18.32666015625, 18.983642578125, 19.640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 5.0, 5.0, 7.0, 14.0, 17.0, 21.0, 24.0, 24.0, 35.0, 24.0, 33.0, 27.0, 40.0, 32.0, 37.0, 52.0, 39.0, 40.0, 41.0, 59.0, 42.0, 44.0, 39.0, 45.0, 34.0, 36.0, 22.0, 27.0, 35.0, 23.0, 13.0, 11.0, 4.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9296875, -12.4833984375, -12.037109375, -11.5908203125, -11.14453125, -10.6982421875, -10.251953125, -9.8056640625, -9.359375, -8.9130859375, -8.466796875, -8.0205078125, -7.57421875, -7.1279296875, -6.681640625, -6.2353515625, -5.7890625, -5.3427734375, -4.896484375, -4.4501953125, -4.00390625, -3.5576171875, -3.111328125, -2.6650390625, -2.21875, -1.7724609375, -1.326171875, -0.8798828125, -0.43359375, 0.0126953125, 0.458984375, 0.9052734375, 1.3515625, 1.7978515625, 2.244140625, 2.6904296875, 3.13671875, 3.5830078125, 4.029296875, 4.4755859375, 4.921875, 5.3681640625, 5.814453125, 6.2607421875, 6.70703125, 7.1533203125, 7.599609375, 8.0458984375, 8.4921875, 8.9384765625, 9.384765625, 9.8310546875, 10.27734375, 10.7236328125, 11.169921875, 11.6162109375, 12.0625, 12.5087890625, 12.955078125, 13.4013671875, 13.84765625, 14.2939453125, 14.740234375, 15.1865234375, 15.6328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 9.0, 6.0, 9.0, 13.0, 32.0, 31.0, 49.0, 88.0, 117.0, 188.0, 256.0, 371.0, 514.0, 756.0, 1131.0, 1735.0, 2682.0, 4214.0, 6791.0, 11057.0, 18085.0, 30351.0, 51383.0, 84966.0, 131749.0, 175347.0, 175052.0, 133830.0, 85964.0, 51801.0, 30699.0, 18409.0, 11279.0, 6829.0, 4318.0, 2855.0, 1783.0, 1211.0, 807.0, 580.0, 389.0, 243.0, 174.0, 130.0, 67.0, 72.0, 54.0, 35.0, 15.0, 7.0, 10.0, 5.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0], "bins": [-8.015625, -7.7652587890625, -7.514892578125, -7.2645263671875, -7.01416015625, -6.7637939453125, -6.513427734375, -6.2630615234375, -6.0126953125, -5.7623291015625, -5.511962890625, -5.2615966796875, -5.01123046875, -4.7608642578125, -4.510498046875, -4.2601318359375, -4.009765625, -3.7593994140625, -3.509033203125, -3.2586669921875, -3.00830078125, -2.7579345703125, -2.507568359375, -2.2572021484375, -2.0068359375, -1.7564697265625, -1.506103515625, -1.2557373046875, -1.00537109375, -0.7550048828125, -0.504638671875, -0.2542724609375, -0.00390625, 0.2464599609375, 0.496826171875, 0.7471923828125, 0.99755859375, 1.2479248046875, 1.498291015625, 1.7486572265625, 1.9990234375, 2.2493896484375, 2.499755859375, 2.7501220703125, 3.00048828125, 3.2508544921875, 3.501220703125, 3.7515869140625, 4.001953125, 4.2523193359375, 4.502685546875, 4.7530517578125, 5.00341796875, 5.2537841796875, 5.504150390625, 5.7545166015625, 6.0048828125, 6.2552490234375, 6.505615234375, 6.7559814453125, 7.00634765625, 7.2567138671875, 7.507080078125, 7.7574462890625, 8.0078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 14.0, 16.0, 29.0, 25.0, 21.0, 52.0, 50.0, 66.0, 84.0, 91.0, 79.0, 76.0, 69.0, 68.0, 63.0, 43.0, 29.0, 27.0, 24.0, 13.0, 12.0, 10.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005860328674316406, -0.0005631521344184875, -0.0005402714014053345, -0.0005173906683921814, -0.0004945099353790283, -0.00047162920236587524, -0.00044874846935272217, -0.0004258677363395691, -0.000402987003326416, -0.00038010627031326294, -0.00035722553730010986, -0.0003343448042869568, -0.0003114640712738037, -0.00028858333826065063, -0.00026570260524749756, -0.00024282187223434448, -0.0002199411392211914, -0.00019706040620803833, -0.00017417967319488525, -0.00015129894018173218, -0.0001284182071685791, -0.00010553747415542603, -8.265674114227295e-05, -5.977600812911987e-05, -3.68952751159668e-05, -1.401454210281372e-05, 8.866190910339355e-06, 3.174692392349243e-05, 5.462765693664551e-05, 7.750838994979858e-05, 0.00010038912296295166, 0.00012326985597610474, 0.0001461505889892578, 0.0001690313220024109, 0.00019191205501556396, 0.00021479278802871704, 0.00023767352104187012, 0.0002605542540550232, 0.00028343498706817627, 0.00030631572008132935, 0.0003291964530944824, 0.0003520771861076355, 0.0003749579191207886, 0.00039783865213394165, 0.0004207193851470947, 0.0004436001181602478, 0.0004664808511734009, 0.000489361584186554, 0.000512242317199707, 0.0005351230502128601, 0.0005580037832260132, 0.0005808845162391663, 0.0006037652492523193, 0.0006266459822654724, 0.0006495267152786255, 0.0006724074482917786, 0.0006952881813049316, 0.0007181689143180847, 0.0007410496473312378, 0.0007639303803443909, 0.0007868111133575439, 0.000809691846370697, 0.0008325725793838501, 0.0008554533123970032, 0.0008783340454101562]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 12.0, 19.0, 34.0, 47.0, 69.0, 92.0, 162.0, 198.0, 281.0, 463.0, 694.0, 1036.0, 1655.0, 2579.0, 3967.0, 5947.0, 9320.0, 14539.0, 22579.0, 34524.0, 52966.0, 76847.0, 106097.0, 131333.0, 140475.0, 127398.0, 101021.0, 73010.0, 49359.0, 32525.0, 20972.0, 13681.0, 8512.0, 5376.0, 3635.0, 2376.0, 1623.0, 1106.0, 688.0, 384.0, 283.0, 217.0, 149.0, 86.0, 71.0, 40.0, 39.0, 20.0, 15.0, 6.0, 6.0, 6.0, 5.0, 6.0, 1.0, 0.0, 1.0], "bins": [-7.609375, -7.3671875, -7.125, -6.8828125, -6.640625, -6.3984375, -6.15625, -5.9140625, -5.671875, -5.4296875, -5.1875, -4.9453125, -4.703125, -4.4609375, -4.21875, -3.9765625, -3.734375, -3.4921875, -3.25, -3.0078125, -2.765625, -2.5234375, -2.28125, -2.0390625, -1.796875, -1.5546875, -1.3125, -1.0703125, -0.828125, -0.5859375, -0.34375, -0.1015625, 0.140625, 0.3828125, 0.625, 0.8671875, 1.109375, 1.3515625, 1.59375, 1.8359375, 2.078125, 2.3203125, 2.5625, 2.8046875, 3.046875, 3.2890625, 3.53125, 3.7734375, 4.015625, 4.2578125, 4.5, 4.7421875, 4.984375, 5.2265625, 5.46875, 5.7109375, 5.953125, 6.1953125, 6.4375, 6.6796875, 6.921875, 7.1640625, 7.40625, 7.6484375, 7.890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 8.0, 5.0, 13.0, 13.0, 16.0, 25.0, 24.0, 27.0, 32.0, 46.0, 57.0, 54.0, 49.0, 69.0, 58.0, 64.0, 55.0, 48.0, 56.0, 44.0, 44.0, 26.0, 19.0, 21.0, 21.0, 18.0, 15.0, 13.0, 11.0, 6.0, 5.0, 8.0, 3.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4765625, -4.348785400390625, -4.22100830078125, -4.093231201171875, -3.9654541015625, -3.837677001953125, -3.70989990234375, -3.582122802734375, -3.454345703125, -3.326568603515625, -3.19879150390625, -3.071014404296875, -2.9432373046875, -2.815460205078125, -2.68768310546875, -2.559906005859375, -2.43212890625, -2.304351806640625, -2.17657470703125, -2.048797607421875, -1.9210205078125, -1.793243408203125, -1.66546630859375, -1.537689208984375, -1.409912109375, -1.282135009765625, -1.15435791015625, -1.026580810546875, -0.8988037109375, -0.771026611328125, -0.64324951171875, -0.515472412109375, -0.3876953125, -0.259918212890625, -0.13214111328125, -0.004364013671875, 0.1234130859375, 0.251190185546875, 0.37896728515625, 0.506744384765625, 0.634521484375, 0.762298583984375, 0.89007568359375, 1.017852783203125, 1.1456298828125, 1.273406982421875, 1.40118408203125, 1.528961181640625, 1.65673828125, 1.784515380859375, 1.91229248046875, 2.040069580078125, 2.1678466796875, 2.295623779296875, 2.42340087890625, 2.551177978515625, 2.678955078125, 2.806732177734375, 2.93450927734375, 3.062286376953125, 3.1900634765625, 3.317840576171875, 3.44561767578125, 3.573394775390625, 3.701171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 9.0, 9.0, 13.0, 11.0, 13.0, 15.0, 19.0, 22.0, 33.0, 38.0, 28.0, 46.0, 38.0, 39.0, 46.0, 41.0, 53.0, 46.0, 40.0, 45.0, 47.0, 41.0, 51.0, 24.0, 35.0, 28.0, 28.0, 23.0, 10.0, 20.0, 12.0, 7.0, 11.0, 10.0, 11.0, 10.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.86770248413086, -19.252059936523438, -18.636415481567383, -18.02077293395996, -17.40513038635254, -16.789485931396484, -16.173843383789062, -15.55820083618164, -14.942557334899902, -14.326913833618164, -13.711271286010742, -13.095627784729004, -12.479984283447266, -11.864341735839844, -11.248698234558105, -10.633054733276367, -10.017412185668945, -9.401768684387207, -8.786126136779785, -8.170482635498047, -7.554839611053467, -6.939196586608887, -6.323553085327148, -5.707910060882568, -5.092267036437988, -4.476624011993408, -3.860980749130249, -3.24533748626709, -2.6296944618225098, -2.0140514373779297, -1.3984081745147705, -0.7827649116516113, -0.16712379455566406, 0.44851934909820557, 1.0641624927520752, 1.6798056364059448, 2.2954487800598145, 2.9110918045043945, 3.5267350673675537, 4.142378330230713, 4.758021354675293, 5.373664379119873, 5.989307403564453, 6.604950904846191, 7.2205939292907715, 7.836236953735352, 8.45188045501709, 9.067523956298828, 9.68316650390625, 10.298810005187988, 10.91445255279541, 11.530096054077148, 12.14573860168457, 12.761382102966309, 13.377025604248047, 13.992668151855469, 14.608311653137207, 15.223955154418945, 15.839597702026367, 16.45524024963379, 17.070884704589844, 17.686527252197266, 18.302169799804688, 18.917814254760742, 19.533456802368164]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 5.0, 14.0, 17.0, 14.0, 14.0, 11.0, 17.0, 29.0, 24.0, 26.0, 25.0, 20.0, 37.0, 31.0, 44.0, 32.0, 31.0, 42.0, 37.0, 41.0, 37.0, 33.0, 34.0, 33.0, 29.0, 25.0, 32.0, 30.0, 23.0, 19.0, 22.0, 18.0, 21.0, 13.0, 20.0, 15.0, 12.0, 11.0, 9.0, 14.0, 5.0, 7.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.9410343170166, -17.404281616210938, -16.867530822753906, -16.330778121948242, -15.794025421142578, -15.25727367401123, -14.720521926879883, -14.183769226074219, -13.647016525268555, -13.110264778137207, -12.573512077331543, -12.036760330200195, -11.500007629394531, -10.963255882263184, -10.426504135131836, -9.889751434326172, -9.352999687194824, -8.816247940063477, -8.279495239257812, -7.742743492126465, -7.205990791320801, -6.669239044189453, -6.132486820220947, -5.595734596252441, -5.0589823722839355, -4.52223014831543, -3.985477924346924, -3.448725938796997, -2.911973714828491, -2.3752214908599854, -1.8384695053100586, -1.3017172813415527, -0.7649650573730469, -0.2282128930091858, 0.3085392713546753, 0.8452913761138916, 1.3820436000823975, 1.9187958240509033, 2.45554780960083, 2.992300033569336, 3.529052257537842, 4.065804481506348, 4.6025567054748535, 5.139308929443359, 5.676060676574707, 6.212813377380371, 6.749565124511719, 7.286317348480225, 7.8230695724487305, 8.359821319580078, 8.896574020385742, 9.43332576751709, 9.970078468322754, 10.506830215454102, 11.043582916259766, 11.580334663391113, 12.117086410522461, 12.653838157653809, 13.190590858459473, 13.72734260559082, 14.264095306396484, 14.800847053527832, 15.33759880065918, 15.874351501464844, 16.411104202270508]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 12.0, 21.0, 48.0, 57.0, 102.0, 171.0, 298.0, 559.0, 1003.0, 1694.0, 2881.0, 5080.0, 8678.0, 14678.0, 24133.0, 38742.0, 58674.0, 83941.0, 108720.0, 127583.0, 133103.0, 124203.0, 101643.0, 75942.0, 52127.0, 33621.0, 20861.0, 12605.0, 7411.0, 4169.0, 2444.0, 1405.0, 837.0, 472.0, 263.0, 159.0, 77.0, 50.0, 37.0, 13.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.453125, -14.98974609375, -14.5263671875, -14.06298828125, -13.599609375, -13.13623046875, -12.6728515625, -12.20947265625, -11.74609375, -11.28271484375, -10.8193359375, -10.35595703125, -9.892578125, -9.42919921875, -8.9658203125, -8.50244140625, -8.0390625, -7.57568359375, -7.1123046875, -6.64892578125, -6.185546875, -5.72216796875, -5.2587890625, -4.79541015625, -4.33203125, -3.86865234375, -3.4052734375, -2.94189453125, -2.478515625, -2.01513671875, -1.5517578125, -1.08837890625, -0.625, -0.16162109375, 0.3017578125, 0.76513671875, 1.228515625, 1.69189453125, 2.1552734375, 2.61865234375, 3.08203125, 3.54541015625, 4.0087890625, 4.47216796875, 4.935546875, 5.39892578125, 5.8623046875, 6.32568359375, 6.7890625, 7.25244140625, 7.7158203125, 8.17919921875, 8.642578125, 9.10595703125, 9.5693359375, 10.03271484375, 10.49609375, 10.95947265625, 11.4228515625, 11.88623046875, 12.349609375, 12.81298828125, 13.2763671875, 13.73974609375, 14.203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 7.0, 5.0, 8.0, 6.0, 16.0, 12.0, 11.0, 17.0, 12.0, 22.0, 24.0, 19.0, 26.0, 33.0, 31.0, 31.0, 36.0, 31.0, 25.0, 34.0, 35.0, 44.0, 28.0, 38.0, 42.0, 23.0, 36.0, 41.0, 26.0, 34.0, 22.0, 26.0, 15.0, 25.0, 22.0, 14.0, 13.0, 11.0, 21.0, 15.0, 12.0, 14.0, 7.0, 3.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-17.71875, -17.177978515625, -16.63720703125, -16.096435546875, -15.5556640625, -15.014892578125, -14.47412109375, -13.933349609375, -13.392578125, -12.851806640625, -12.31103515625, -11.770263671875, -11.2294921875, -10.688720703125, -10.14794921875, -9.607177734375, -9.06640625, -8.525634765625, -7.98486328125, -7.444091796875, -6.9033203125, -6.362548828125, -5.82177734375, -5.281005859375, -4.740234375, -4.199462890625, -3.65869140625, -3.117919921875, -2.5771484375, -2.036376953125, -1.49560546875, -0.954833984375, -0.4140625, 0.126708984375, 0.66748046875, 1.208251953125, 1.7490234375, 2.289794921875, 2.83056640625, 3.371337890625, 3.912109375, 4.452880859375, 4.99365234375, 5.534423828125, 6.0751953125, 6.615966796875, 7.15673828125, 7.697509765625, 8.23828125, 8.779052734375, 9.31982421875, 9.860595703125, 10.4013671875, 10.942138671875, 11.48291015625, 12.023681640625, 12.564453125, 13.105224609375, 13.64599609375, 14.186767578125, 14.7275390625, 15.268310546875, 15.80908203125, 16.349853515625, 16.890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 3.0, 10.0, 18.0, 20.0, 30.0, 50.0, 75.0, 125.0, 191.0, 307.0, 506.0, 762.0, 1160.0, 1749.0, 2755.0, 4333.0, 6612.0, 10169.0, 15319.0, 23216.0, 33163.0, 46830.0, 62148.0, 78324.0, 93730.0, 104400.0, 106741.0, 102072.0, 90312.0, 74180.0, 57683.0, 42280.0, 29903.0, 20506.0, 13631.0, 8910.0, 5797.0, 3739.0, 2449.0, 1506.0, 1024.0, 682.0, 395.0, 271.0, 176.0, 110.0, 74.0, 45.0, 34.0, 14.0, 11.0, 9.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3477783203125, -10.961181640625, -10.5745849609375, -10.18798828125, -9.8013916015625, -9.414794921875, -9.0281982421875, -8.6416015625, -8.2550048828125, -7.868408203125, -7.4818115234375, -7.09521484375, -6.7086181640625, -6.322021484375, -5.9354248046875, -5.548828125, -5.1622314453125, -4.775634765625, -4.3890380859375, -4.00244140625, -3.6158447265625, -3.229248046875, -2.8426513671875, -2.4560546875, -2.0694580078125, -1.682861328125, -1.2962646484375, -0.90966796875, -0.5230712890625, -0.136474609375, 0.2501220703125, 0.63671875, 1.0233154296875, 1.409912109375, 1.7965087890625, 2.18310546875, 2.5697021484375, 2.956298828125, 3.3428955078125, 3.7294921875, 4.1160888671875, 4.502685546875, 4.8892822265625, 5.27587890625, 5.6624755859375, 6.049072265625, 6.4356689453125, 6.822265625, 7.2088623046875, 7.595458984375, 7.9820556640625, 8.36865234375, 8.7552490234375, 9.141845703125, 9.5284423828125, 9.9150390625, 10.3016357421875, 10.688232421875, 11.0748291015625, 11.46142578125, 11.8480224609375, 12.234619140625, 12.6212158203125, 13.0078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 4.0, 8.0, 5.0, 12.0, 6.0, 16.0, 13.0, 11.0, 15.0, 18.0, 19.0, 25.0, 28.0, 30.0, 31.0, 51.0, 33.0, 51.0, 36.0, 44.0, 47.0, 35.0, 43.0, 50.0, 29.0, 28.0, 33.0, 35.0, 36.0, 25.0, 22.0, 30.0, 25.0, 14.0, 21.0, 13.0, 15.0, 16.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.1796875, -11.7880859375, -11.396484375, -11.0048828125, -10.61328125, -10.2216796875, -9.830078125, -9.4384765625, -9.046875, -8.6552734375, -8.263671875, -7.8720703125, -7.48046875, -7.0888671875, -6.697265625, -6.3056640625, -5.9140625, -5.5224609375, -5.130859375, -4.7392578125, -4.34765625, -3.9560546875, -3.564453125, -3.1728515625, -2.78125, -2.3896484375, -1.998046875, -1.6064453125, -1.21484375, -0.8232421875, -0.431640625, -0.0400390625, 0.3515625, 0.7431640625, 1.134765625, 1.5263671875, 1.91796875, 2.3095703125, 2.701171875, 3.0927734375, 3.484375, 3.8759765625, 4.267578125, 4.6591796875, 5.05078125, 5.4423828125, 5.833984375, 6.2255859375, 6.6171875, 7.0087890625, 7.400390625, 7.7919921875, 8.18359375, 8.5751953125, 8.966796875, 9.3583984375, 9.75, 10.1416015625, 10.533203125, 10.9248046875, 11.31640625, 11.7080078125, 12.099609375, 12.4912109375, 12.8828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 8.0, 13.0, 23.0, 23.0, 45.0, 68.0, 110.0, 219.0, 366.0, 694.0, 1126.0, 2002.0, 3420.0, 6234.0, 10721.0, 18547.0, 30973.0, 49694.0, 74866.0, 103842.0, 129700.0, 141543.0, 134997.0, 112594.0, 83144.0, 56563.0, 35895.0, 21373.0, 12771.0, 7334.0, 4151.0, 2348.0, 1315.0, 734.0, 455.0, 237.0, 154.0, 107.0, 51.0, 33.0, 16.0, 16.0, 8.0, 5.0, 4.0, 9.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.859375, -5.6617431640625, -5.464111328125, -5.2664794921875, -5.06884765625, -4.8712158203125, -4.673583984375, -4.4759521484375, -4.2783203125, -4.0806884765625, -3.883056640625, -3.6854248046875, -3.48779296875, -3.2901611328125, -3.092529296875, -2.8948974609375, -2.697265625, -2.4996337890625, -2.302001953125, -2.1043701171875, -1.90673828125, -1.7091064453125, -1.511474609375, -1.3138427734375, -1.1162109375, -0.9185791015625, -0.720947265625, -0.5233154296875, -0.32568359375, -0.1280517578125, 0.069580078125, 0.2672119140625, 0.46484375, 0.6624755859375, 0.860107421875, 1.0577392578125, 1.25537109375, 1.4530029296875, 1.650634765625, 1.8482666015625, 2.0458984375, 2.2435302734375, 2.441162109375, 2.6387939453125, 2.83642578125, 3.0340576171875, 3.231689453125, 3.4293212890625, 3.626953125, 3.8245849609375, 4.022216796875, 4.2198486328125, 4.41748046875, 4.6151123046875, 4.812744140625, 5.0103759765625, 5.2080078125, 5.4056396484375, 5.603271484375, 5.8009033203125, 5.99853515625, 6.1961669921875, 6.393798828125, 6.5914306640625, 6.7890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 4.0, 5.0, 10.0, 11.0, 11.0, 18.0, 16.0, 28.0, 23.0, 30.0, 33.0, 35.0, 41.0, 57.0, 42.0, 50.0, 53.0, 70.0, 57.0, 48.0, 53.0, 41.0, 37.0, 23.0, 35.0, 29.0, 21.0, 19.0, 17.0, 11.0, 14.0, 7.0, 6.0, 6.0, 7.0, 9.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0006823539733886719, -0.0006611272692680359, -0.0006399005651473999, -0.0006186738610267639, -0.0005974471569061279, -0.0005762204527854919, -0.000554993748664856, -0.00053376704454422, -0.000512540340423584, -0.000491313636302948, -0.000470086932182312, -0.000448860228061676, -0.00042763352394104004, -0.00040640681982040405, -0.00038518011569976807, -0.0003639534115791321, -0.0003427267074584961, -0.0003215000033378601, -0.0003002732992172241, -0.00027904659509658813, -0.00025781989097595215, -0.00023659318685531616, -0.00021536648273468018, -0.0001941397786140442, -0.0001729130744934082, -0.00015168637037277222, -0.00013045966625213623, -0.00010923296213150024, -8.800625801086426e-05, -6.677955389022827e-05, -4.5552849769592285e-05, -2.43261456489563e-05, -3.0994415283203125e-06, 1.8127262592315674e-05, 3.935396671295166e-05, 6.0580670833587646e-05, 8.180737495422363e-05, 0.00010303407907485962, 0.0001242607831954956, 0.0001454874873161316, 0.00016671419143676758, 0.00018794089555740356, 0.00020916759967803955, 0.00023039430379867554, 0.0002516210079193115, 0.0002728477120399475, 0.0002940744161605835, 0.0003153011202812195, 0.00033652782440185547, 0.00035775452852249146, 0.00037898123264312744, 0.00040020793676376343, 0.0004214346408843994, 0.0004426613450050354, 0.0004638880491256714, 0.0004851147532463074, 0.0005063414573669434, 0.0005275681614875793, 0.0005487948656082153, 0.0005700215697288513, 0.0005912482738494873, 0.0006124749779701233, 0.0006337016820907593, 0.0006549283862113953, 0.0006761550903320312]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 17.0, 27.0, 48.0, 68.0, 112.0, 172.0, 272.0, 401.0, 661.0, 1096.0, 1687.0, 2645.0, 4155.0, 6653.0, 10432.0, 15586.0, 23692.0, 34667.0, 49094.0, 66114.0, 83943.0, 99681.0, 109315.0, 109929.0, 102336.0, 88694.0, 70025.0, 53127.0, 37970.0, 26432.0, 17613.0, 11527.0, 7371.0, 4819.0, 3034.0, 1878.0, 1211.0, 724.0, 492.0, 301.0, 185.0, 122.0, 74.0, 54.0, 33.0, 24.0, 12.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.558349609375, -4.40185546875, -4.245361328125, -4.0888671875, -3.932373046875, -3.77587890625, -3.619384765625, -3.462890625, -3.306396484375, -3.14990234375, -2.993408203125, -2.8369140625, -2.680419921875, -2.52392578125, -2.367431640625, -2.2109375, -2.054443359375, -1.89794921875, -1.741455078125, -1.5849609375, -1.428466796875, -1.27197265625, -1.115478515625, -0.958984375, -0.802490234375, -0.64599609375, -0.489501953125, -0.3330078125, -0.176513671875, -0.02001953125, 0.136474609375, 0.29296875, 0.449462890625, 0.60595703125, 0.762451171875, 0.9189453125, 1.075439453125, 1.23193359375, 1.388427734375, 1.544921875, 1.701416015625, 1.85791015625, 2.014404296875, 2.1708984375, 2.327392578125, 2.48388671875, 2.640380859375, 2.796875, 2.953369140625, 3.10986328125, 3.266357421875, 3.4228515625, 3.579345703125, 3.73583984375, 3.892333984375, 4.048828125, 4.205322265625, 4.36181640625, 4.518310546875, 4.6748046875, 4.831298828125, 4.98779296875, 5.144287109375, 5.30078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 10.0, 14.0, 8.0, 12.0, 13.0, 10.0, 21.0, 16.0, 12.0, 31.0, 25.0, 27.0, 33.0, 39.0, 43.0, 43.0, 30.0, 42.0, 45.0, 40.0, 43.0, 36.0, 41.0, 37.0, 35.0, 37.0, 34.0, 28.0, 33.0, 23.0, 20.0, 22.0, 17.0, 20.0, 10.0, 14.0, 10.0, 3.0, 10.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.698211669921875, -1.63275146484375, -1.567291259765625, -1.5018310546875, -1.436370849609375, -1.37091064453125, -1.305450439453125, -1.239990234375, -1.174530029296875, -1.10906982421875, -1.043609619140625, -0.9781494140625, -0.912689208984375, -0.84722900390625, -0.781768798828125, -0.71630859375, -0.650848388671875, -0.58538818359375, -0.519927978515625, -0.4544677734375, -0.389007568359375, -0.32354736328125, -0.258087158203125, -0.192626953125, -0.127166748046875, -0.06170654296875, 0.003753662109375, 0.0692138671875, 0.134674072265625, 0.20013427734375, 0.265594482421875, 0.3310546875, 0.396514892578125, 0.46197509765625, 0.527435302734375, 0.5928955078125, 0.658355712890625, 0.72381591796875, 0.789276123046875, 0.854736328125, 0.920196533203125, 0.98565673828125, 1.051116943359375, 1.1165771484375, 1.182037353515625, 1.24749755859375, 1.312957763671875, 1.37841796875, 1.443878173828125, 1.50933837890625, 1.574798583984375, 1.6402587890625, 1.705718994140625, 1.77117919921875, 1.836639404296875, 1.902099609375, 1.967559814453125, 2.03302001953125, 2.098480224609375, 2.1639404296875, 2.229400634765625, 2.29486083984375, 2.360321044921875, 2.42578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 1.0, 7.0, 6.0, 4.0, 8.0, 14.0, 6.0, 14.0, 13.0, 13.0, 27.0, 34.0, 34.0, 25.0, 30.0, 33.0, 49.0, 33.0, 33.0, 48.0, 46.0, 43.0, 37.0, 39.0, 46.0, 39.0, 31.0, 30.0, 29.0, 30.0, 20.0, 25.0, 31.0, 21.0, 13.0, 17.0, 11.0, 12.0, 6.0, 12.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-16.721254348754883, -16.153564453125, -15.5858736038208, -15.018182754516602, -14.450492858886719, -13.88280200958252, -13.31511116027832, -12.747421264648438, -12.179730415344238, -11.612039566040039, -11.044349670410156, -10.476658821105957, -9.908967971801758, -9.341278076171875, -8.773587226867676, -8.205896377563477, -7.638206481933594, -7.070516109466553, -6.502825736999512, -5.9351348876953125, -5.3674445152282715, -4.7997541427612305, -4.232063293457031, -3.6643729209899902, -3.096682548522949, -2.528992176055908, -1.961301565170288, -1.3936110734939575, -0.825920581817627, -0.25823020935058594, 0.3094604015350342, 0.8771510124206543, 1.4448394775390625, 2.0125298500061035, 2.5802204608917236, 3.1479110717773438, 3.7156014442443848, 4.283291816711426, 4.850982666015625, 5.418673038482666, 5.986363410949707, 6.554053783416748, 7.121744155883789, 7.689435005187988, 8.257125854492188, 8.82481575012207, 9.39250659942627, 9.960197448730469, 10.527887344360352, 11.09557819366455, 11.663268089294434, 12.230958938598633, 12.798648834228516, 13.366339683532715, 13.934030532836914, 14.501720428466797, 15.069411277770996, 15.637102127075195, 16.204792022705078, 16.77248191833496, 17.340173721313477, 17.90786361694336, 18.475553512573242, 19.043245315551758, 19.61093521118164]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 14.0, 11.0, 15.0, 10.0, 19.0, 14.0, 25.0, 18.0, 24.0, 26.0, 20.0, 35.0, 33.0, 39.0, 33.0, 34.0, 37.0, 47.0, 39.0, 33.0, 45.0, 35.0, 36.0, 38.0, 42.0, 32.0, 21.0, 32.0, 21.0, 29.0, 20.0, 15.0, 21.0, 18.0, 13.0, 10.0, 9.0, 8.0, 6.0, 7.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.333984375, -17.72174835205078, -17.109512329101562, -16.497278213500977, -15.885042190551758, -15.272806167602539, -14.660571098327637, -14.048336029052734, -13.436100006103516, -12.823863983154297, -12.211628913879395, -11.599393844604492, -10.987157821655273, -10.374921798706055, -9.762686729431152, -9.15045166015625, -8.538215637207031, -7.925980091094971, -7.31374454498291, -6.70150899887085, -6.089273452758789, -5.4770379066467285, -4.864802360534668, -4.252566814422607, -3.640331268310547, -3.0280957221984863, -2.415860176086426, -1.8036246299743652, -1.1913890838623047, -0.5791535377502441, 0.033082008361816406, 0.645317554473877, 1.2575550079345703, 1.8697905540466309, 2.4820261001586914, 3.094261646270752, 3.7064971923828125, 4.318732738494873, 4.930968284606934, 5.543203830718994, 6.155439376831055, 6.767674922943115, 7.379910469055176, 7.992146015167236, 8.604381561279297, 9.216617584228516, 9.828852653503418, 10.44108772277832, 11.053323745727539, 11.665559768676758, 12.27779483795166, 12.890029907226562, 13.502265930175781, 14.114501953125, 14.726737022399902, 15.338972091674805, 15.951208114624023, 16.563444137573242, 17.175678253173828, 17.787914276123047, 18.400150299072266, 19.012386322021484, 19.624622344970703, 20.23685646057129, 20.849092483520508]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 7.0, 4.0, 15.0, 24.0, 37.0, 36.0, 51.0, 107.0, 163.0, 234.0, 341.0, 511.0, 808.0, 1277.0, 1985.0, 3091.0, 5096.0, 8472.0, 13963.0, 23471.0, 39766.0, 68711.0, 118121.0, 199324.0, 321115.0, 473163.0, 603713.0, 643699.0, 566150.0, 420068.0, 276055.0, 166761.0, 98567.0, 57147.0, 33648.0, 19303.0, 11493.0, 6834.0, 4143.0, 2505.0, 1601.0, 998.0, 645.0, 377.0, 250.0, 154.0, 108.0, 53.0, 52.0, 32.0, 18.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0], "bins": [-16.28125, -15.792724609375, -15.30419921875, -14.815673828125, -14.3271484375, -13.838623046875, -13.35009765625, -12.861572265625, -12.373046875, -11.884521484375, -11.39599609375, -10.907470703125, -10.4189453125, -9.930419921875, -9.44189453125, -8.953369140625, -8.46484375, -7.976318359375, -7.48779296875, -6.999267578125, -6.5107421875, -6.022216796875, -5.53369140625, -5.045166015625, -4.556640625, -4.068115234375, -3.57958984375, -3.091064453125, -2.6025390625, -2.114013671875, -1.62548828125, -1.136962890625, -0.6484375, -0.159912109375, 0.32861328125, 0.817138671875, 1.3056640625, 1.794189453125, 2.28271484375, 2.771240234375, 3.259765625, 3.748291015625, 4.23681640625, 4.725341796875, 5.2138671875, 5.702392578125, 6.19091796875, 6.679443359375, 7.16796875, 7.656494140625, 8.14501953125, 8.633544921875, 9.1220703125, 9.610595703125, 10.09912109375, 10.587646484375, 11.076171875, 11.564697265625, 12.05322265625, 12.541748046875, 13.0302734375, 13.518798828125, 14.00732421875, 14.495849609375, 14.984375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 3.0, 9.0, 17.0, 16.0, 7.0, 16.0, 23.0, 23.0, 27.0, 22.0, 29.0, 28.0, 33.0, 17.0, 28.0, 34.0, 38.0, 25.0, 41.0, 38.0, 42.0, 35.0, 39.0, 30.0, 34.0, 37.0, 27.0, 20.0, 27.0, 23.0, 22.0, 20.0, 18.0, 24.0, 17.0, 17.0, 15.0, 17.0, 6.0, 4.0, 10.0, 9.0, 4.0, 1.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-15.265625, -14.7884521484375, -14.311279296875, -13.8341064453125, -13.35693359375, -12.8797607421875, -12.402587890625, -11.9254150390625, -11.4482421875, -10.9710693359375, -10.493896484375, -10.0167236328125, -9.53955078125, -9.0623779296875, -8.585205078125, -8.1080322265625, -7.630859375, -7.1536865234375, -6.676513671875, -6.1993408203125, -5.72216796875, -5.2449951171875, -4.767822265625, -4.2906494140625, -3.8134765625, -3.3363037109375, -2.859130859375, -2.3819580078125, -1.90478515625, -1.4276123046875, -0.950439453125, -0.4732666015625, 0.00390625, 0.4810791015625, 0.958251953125, 1.4354248046875, 1.91259765625, 2.3897705078125, 2.866943359375, 3.3441162109375, 3.8212890625, 4.2984619140625, 4.775634765625, 5.2528076171875, 5.72998046875, 6.2071533203125, 6.684326171875, 7.1614990234375, 7.638671875, 8.1158447265625, 8.593017578125, 9.0701904296875, 9.54736328125, 10.0245361328125, 10.501708984375, 10.9788818359375, 11.4560546875, 11.9332275390625, 12.410400390625, 12.8875732421875, 13.36474609375, 13.8419189453125, 14.319091796875, 14.7962646484375, 15.2734375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 12.0, 14.0, 23.0, 43.0, 65.0, 111.0, 145.0, 295.0, 430.0, 676.0, 1115.0, 1908.0, 3232.0, 5587.0, 9589.0, 16428.0, 29192.0, 50770.0, 87417.0, 149491.0, 246541.0, 382415.0, 533270.0, 637130.0, 624706.0, 507071.0, 355091.0, 227089.0, 136787.0, 79250.0, 45905.0, 26083.0, 14930.0, 8789.0, 5116.0, 3043.0, 1772.0, 1074.0, 677.0, 387.0, 220.0, 137.0, 94.0, 59.0, 35.0, 32.0, 12.0, 14.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.59912109375, -17.0107421875, -16.42236328125, -15.833984375, -15.24560546875, -14.6572265625, -14.06884765625, -13.48046875, -12.89208984375, -12.3037109375, -11.71533203125, -11.126953125, -10.53857421875, -9.9501953125, -9.36181640625, -8.7734375, -8.18505859375, -7.5966796875, -7.00830078125, -6.419921875, -5.83154296875, -5.2431640625, -4.65478515625, -4.06640625, -3.47802734375, -2.8896484375, -2.30126953125, -1.712890625, -1.12451171875, -0.5361328125, 0.05224609375, 0.640625, 1.22900390625, 1.8173828125, 2.40576171875, 2.994140625, 3.58251953125, 4.1708984375, 4.75927734375, 5.34765625, 5.93603515625, 6.5244140625, 7.11279296875, 7.701171875, 8.28955078125, 8.8779296875, 9.46630859375, 10.0546875, 10.64306640625, 11.2314453125, 11.81982421875, 12.408203125, 12.99658203125, 13.5849609375, 14.17333984375, 14.76171875, 15.35009765625, 15.9384765625, 16.52685546875, 17.115234375, 17.70361328125, 18.2919921875, 18.88037109375, 19.46875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 9.0, 11.0, 26.0, 21.0, 27.0, 38.0, 41.0, 58.0, 60.0, 80.0, 110.0, 127.0, 151.0, 170.0, 210.0, 237.0, 231.0, 256.0, 234.0, 262.0, 238.0, 226.0, 200.0, 203.0, 149.0, 142.0, 126.0, 103.0, 87.0, 61.0, 50.0, 39.0, 25.0, 21.0, 11.0, 11.0, 8.0, 7.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.78515625, -7.52044677734375, -7.2557373046875, -6.99102783203125, -6.726318359375, -6.46160888671875, -6.1968994140625, -5.93218994140625, -5.66748046875, -5.40277099609375, -5.1380615234375, -4.87335205078125, -4.608642578125, -4.34393310546875, -4.0792236328125, -3.81451416015625, -3.5498046875, -3.28509521484375, -3.0203857421875, -2.75567626953125, -2.490966796875, -2.22625732421875, -1.9615478515625, -1.69683837890625, -1.43212890625, -1.16741943359375, -0.9027099609375, -0.63800048828125, -0.373291015625, -0.10858154296875, 0.1561279296875, 0.42083740234375, 0.685546875, 0.95025634765625, 1.2149658203125, 1.47967529296875, 1.744384765625, 2.00909423828125, 2.2738037109375, 2.53851318359375, 2.80322265625, 3.06793212890625, 3.3326416015625, 3.59735107421875, 3.862060546875, 4.12677001953125, 4.3914794921875, 4.65618896484375, 4.9208984375, 5.18560791015625, 5.4503173828125, 5.71502685546875, 5.979736328125, 6.24444580078125, 6.5091552734375, 6.77386474609375, 7.03857421875, 7.30328369140625, 7.5679931640625, 7.83270263671875, 8.097412109375, 8.36212158203125, 8.6268310546875, 8.89154052734375, 9.15625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 14.0, 12.0, 18.0, 22.0, 16.0, 30.0, 29.0, 30.0, 33.0, 39.0, 39.0, 51.0, 50.0, 46.0, 47.0, 46.0, 40.0, 47.0, 61.0, 41.0, 42.0, 40.0, 31.0, 18.0, 21.0, 23.0, 26.0, 23.0, 10.0, 16.0, 6.0, 8.0, 4.0, 0.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.351669311523438, -19.65229606628418, -18.952922821044922, -18.253549575805664, -17.554176330566406, -16.85480308532715, -16.15542984008789, -15.456056594848633, -14.756683349609375, -14.057310104370117, -13.35793685913086, -12.658563613891602, -11.959190368652344, -11.259817123413086, -10.560443878173828, -9.86107063293457, -9.161697387695312, -8.462324142456055, -7.762950897216797, -7.063577651977539, -6.364204406738281, -5.664831161499023, -4.965457916259766, -4.266084671020508, -3.56671142578125, -2.867338180541992, -2.1679649353027344, -1.4685916900634766, -0.7692184448242188, -0.06984519958496094, 0.6295280456542969, 1.3289012908935547, 2.0282764434814453, 2.727649688720703, 3.427022933959961, 4.126396179199219, 4.825769424438477, 5.525142669677734, 6.224515914916992, 6.92388916015625, 7.623262405395508, 8.322635650634766, 9.022008895874023, 9.721382141113281, 10.420755386352539, 11.120128631591797, 11.819501876831055, 12.518875122070312, 13.21824836730957, 13.917621612548828, 14.616994857788086, 15.316368103027344, 16.0157413482666, 16.71511459350586, 17.414487838745117, 18.113861083984375, 18.813234329223633, 19.51260757446289, 20.21198081970215, 20.911354064941406, 21.610727310180664, 22.310100555419922, 23.00947380065918, 23.708847045898438, 24.408220291137695]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 5.0, 3.0, 4.0, 6.0, 11.0, 11.0, 17.0, 20.0, 18.0, 21.0, 24.0, 25.0, 29.0, 38.0, 36.0, 25.0, 46.0, 47.0, 43.0, 46.0, 39.0, 39.0, 51.0, 40.0, 40.0, 42.0, 34.0, 28.0, 23.0, 25.0, 28.0, 24.0, 22.0, 15.0, 12.0, 19.0, 16.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.457382202148438, -17.819278717041016, -17.181175231933594, -16.543071746826172, -15.90496826171875, -15.266864776611328, -14.628761291503906, -13.990657806396484, -13.352554321289062, -12.71445083618164, -12.076347351074219, -11.438243865966797, -10.800140380859375, -10.162036895751953, -9.523933410644531, -8.88582992553711, -8.247726440429688, -7.609622955322266, -6.971519470214844, -6.333415985107422, -5.6953125, -5.057209014892578, -4.419105529785156, -3.7810020446777344, -3.1428985595703125, -2.5047950744628906, -1.8666915893554688, -1.2285881042480469, -0.590484619140625, 0.047618865966796875, 0.6857223510742188, 1.3238258361816406, 1.9619293212890625, 2.6000328063964844, 3.2381362915039062, 3.876239776611328, 4.51434326171875, 5.152446746826172, 5.790550231933594, 6.428653717041016, 7.0667572021484375, 7.704860687255859, 8.342964172363281, 8.981067657470703, 9.619171142578125, 10.257274627685547, 10.895378112792969, 11.53348159790039, 12.171585083007812, 12.809688568115234, 13.447792053222656, 14.085895538330078, 14.7239990234375, 15.362102508544922, 16.000205993652344, 16.638309478759766, 17.276412963867188, 17.91451644897461, 18.55261993408203, 19.190723419189453, 19.828826904296875, 20.466930389404297, 21.10503387451172, 21.74313735961914, 22.381240844726562]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 10.0, 8.0, 18.0, 31.0, 33.0, 54.0, 80.0, 149.0, 234.0, 375.0, 592.0, 962.0, 1550.0, 2508.0, 3945.0, 6426.0, 10275.0, 16883.0, 26479.0, 41017.0, 60650.0, 85096.0, 109059.0, 127331.0, 130225.0, 119083.0, 96159.0, 71876.0, 49278.0, 33179.0, 20884.0, 12985.0, 8067.0, 4974.0, 3016.0, 1947.0, 1144.0, 711.0, 451.0, 297.0, 184.0, 121.0, 79.0, 48.0, 26.0, 16.0, 12.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.5078125, -10.17138671875, -9.8349609375, -9.49853515625, -9.162109375, -8.82568359375, -8.4892578125, -8.15283203125, -7.81640625, -7.47998046875, -7.1435546875, -6.80712890625, -6.470703125, -6.13427734375, -5.7978515625, -5.46142578125, -5.125, -4.78857421875, -4.4521484375, -4.11572265625, -3.779296875, -3.44287109375, -3.1064453125, -2.77001953125, -2.43359375, -2.09716796875, -1.7607421875, -1.42431640625, -1.087890625, -0.75146484375, -0.4150390625, -0.07861328125, 0.2578125, 0.59423828125, 0.9306640625, 1.26708984375, 1.603515625, 1.93994140625, 2.2763671875, 2.61279296875, 2.94921875, 3.28564453125, 3.6220703125, 3.95849609375, 4.294921875, 4.63134765625, 4.9677734375, 5.30419921875, 5.640625, 5.97705078125, 6.3134765625, 6.64990234375, 6.986328125, 7.32275390625, 7.6591796875, 7.99560546875, 8.33203125, 8.66845703125, 9.0048828125, 9.34130859375, 9.677734375, 10.01416015625, 10.3505859375, 10.68701171875, 11.0234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 12.0, 11.0, 12.0, 12.0, 10.0, 22.0, 16.0, 20.0, 19.0, 27.0, 33.0, 31.0, 33.0, 28.0, 27.0, 49.0, 42.0, 31.0, 48.0, 41.0, 35.0, 48.0, 36.0, 38.0, 39.0, 23.0, 23.0, 20.0, 31.0, 22.0, 23.0, 16.0, 16.0, 25.0, 12.0, 10.0, 14.0, 3.0, 12.0, 11.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.625, -18.03125, -17.4375, -16.84375, -16.25, -15.65625, -15.0625, -14.46875, -13.875, -13.28125, -12.6875, -12.09375, -11.5, -10.90625, -10.3125, -9.71875, -9.125, -8.53125, -7.9375, -7.34375, -6.75, -6.15625, -5.5625, -4.96875, -4.375, -3.78125, -3.1875, -2.59375, -2.0, -1.40625, -0.8125, -0.21875, 0.375, 0.96875, 1.5625, 2.15625, 2.75, 3.34375, 3.9375, 4.53125, 5.125, 5.71875, 6.3125, 6.90625, 7.5, 8.09375, 8.6875, 9.28125, 9.875, 10.46875, 11.0625, 11.65625, 12.25, 12.84375, 13.4375, 14.03125, 14.625, 15.21875, 15.8125, 16.40625, 17.0, 17.59375, 18.1875, 18.78125, 19.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 13.0, 13.0, 24.0, 30.0, 48.0, 76.0, 128.0, 188.0, 294.0, 399.0, 658.0, 1026.0, 1695.0, 2778.0, 4642.0, 7849.0, 13339.0, 23199.0, 39968.0, 67060.0, 104994.0, 149002.0, 171532.0, 157067.0, 116240.0, 75849.0, 45854.0, 26479.0, 15553.0, 9113.0, 5269.0, 3078.0, 1977.0, 1142.0, 703.0, 428.0, 302.0, 163.0, 120.0, 90.0, 54.0, 37.0, 28.0, 14.0, 13.0, 10.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.129638671875, -15.60302734375, -15.076416015625, -14.5498046875, -14.023193359375, -13.49658203125, -12.969970703125, -12.443359375, -11.916748046875, -11.39013671875, -10.863525390625, -10.3369140625, -9.810302734375, -9.28369140625, -8.757080078125, -8.23046875, -7.703857421875, -7.17724609375, -6.650634765625, -6.1240234375, -5.597412109375, -5.07080078125, -4.544189453125, -4.017578125, -3.490966796875, -2.96435546875, -2.437744140625, -1.9111328125, -1.384521484375, -0.85791015625, -0.331298828125, 0.1953125, 0.721923828125, 1.24853515625, 1.775146484375, 2.3017578125, 2.828369140625, 3.35498046875, 3.881591796875, 4.408203125, 4.934814453125, 5.46142578125, 5.988037109375, 6.5146484375, 7.041259765625, 7.56787109375, 8.094482421875, 8.62109375, 9.147705078125, 9.67431640625, 10.200927734375, 10.7275390625, 11.254150390625, 11.78076171875, 12.307373046875, 12.833984375, 13.360595703125, 13.88720703125, 14.413818359375, 14.9404296875, 15.467041015625, 15.99365234375, 16.520263671875, 17.046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 4.0, 9.0, 14.0, 6.0, 13.0, 27.0, 19.0, 16.0, 21.0, 16.0, 33.0, 23.0, 25.0, 31.0, 41.0, 40.0, 36.0, 44.0, 31.0, 42.0, 33.0, 28.0, 37.0, 40.0, 25.0, 38.0, 36.0, 28.0, 28.0, 30.0, 15.0, 20.0, 19.0, 19.0, 15.0, 18.0, 9.0, 12.0, 9.0, 9.0, 9.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-11.8125, -11.4539794921875, -11.095458984375, -10.7369384765625, -10.37841796875, -10.0198974609375, -9.661376953125, -9.3028564453125, -8.9443359375, -8.5858154296875, -8.227294921875, -7.8687744140625, -7.51025390625, -7.1517333984375, -6.793212890625, -6.4346923828125, -6.076171875, -5.7176513671875, -5.359130859375, -5.0006103515625, -4.64208984375, -4.2835693359375, -3.925048828125, -3.5665283203125, -3.2080078125, -2.8494873046875, -2.490966796875, -2.1324462890625, -1.77392578125, -1.4154052734375, -1.056884765625, -0.6983642578125, -0.33984375, 0.0186767578125, 0.377197265625, 0.7357177734375, 1.09423828125, 1.4527587890625, 1.811279296875, 2.1697998046875, 2.5283203125, 2.8868408203125, 3.245361328125, 3.6038818359375, 3.96240234375, 4.3209228515625, 4.679443359375, 5.0379638671875, 5.396484375, 5.7550048828125, 6.113525390625, 6.4720458984375, 6.83056640625, 7.1890869140625, 7.547607421875, 7.9061279296875, 8.2646484375, 8.6231689453125, 8.981689453125, 9.3402099609375, 9.69873046875, 10.0572509765625, 10.415771484375, 10.7742919921875, 11.1328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 12.0, 20.0, 27.0, 36.0, 68.0, 86.0, 167.0, 208.0, 304.0, 488.0, 739.0, 1094.0, 1719.0, 2685.0, 4196.0, 6817.0, 10731.0, 17258.0, 27542.0, 43282.0, 67099.0, 97967.0, 131682.0, 151988.0, 143752.0, 114291.0, 79670.0, 52837.0, 33878.0, 21431.0, 13350.0, 8299.0, 5268.0, 3315.0, 2132.0, 1405.0, 876.0, 635.0, 401.0, 249.0, 175.0, 138.0, 71.0, 42.0, 40.0, 25.0, 18.0, 14.0, 12.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.30859375, -6.1097412109375, -5.910888671875, -5.7120361328125, -5.51318359375, -5.3143310546875, -5.115478515625, -4.9166259765625, -4.7177734375, -4.5189208984375, -4.320068359375, -4.1212158203125, -3.92236328125, -3.7235107421875, -3.524658203125, -3.3258056640625, -3.126953125, -2.9281005859375, -2.729248046875, -2.5303955078125, -2.33154296875, -2.1326904296875, -1.933837890625, -1.7349853515625, -1.5361328125, -1.3372802734375, -1.138427734375, -0.9395751953125, -0.74072265625, -0.5418701171875, -0.343017578125, -0.1441650390625, 0.0546875, 0.2535400390625, 0.452392578125, 0.6512451171875, 0.85009765625, 1.0489501953125, 1.247802734375, 1.4466552734375, 1.6455078125, 1.8443603515625, 2.043212890625, 2.2420654296875, 2.44091796875, 2.6397705078125, 2.838623046875, 3.0374755859375, 3.236328125, 3.4351806640625, 3.634033203125, 3.8328857421875, 4.03173828125, 4.2305908203125, 4.429443359375, 4.6282958984375, 4.8271484375, 5.0260009765625, 5.224853515625, 5.4237060546875, 5.62255859375, 5.8214111328125, 6.020263671875, 6.2191162109375, 6.41796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 8.0, 2.0, 5.0, 7.0, 4.0, 13.0, 13.0, 9.0, 21.0, 27.0, 28.0, 29.0, 37.0, 45.0, 29.0, 42.0, 61.0, 50.0, 47.0, 43.0, 52.0, 46.0, 42.0, 38.0, 48.0, 32.0, 29.0, 31.0, 29.0, 25.0, 15.0, 25.0, 14.0, 10.0, 10.0, 8.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0], "bins": [-0.0005035400390625, -0.0004904791712760925, -0.00047741830348968506, -0.0004643574357032776, -0.0004512965679168701, -0.00043823570013046265, -0.0004251748323440552, -0.0004121139645576477, -0.00039905309677124023, -0.00038599222898483276, -0.0003729313611984253, -0.0003598704934120178, -0.00034680962562561035, -0.0003337487578392029, -0.0003206878900527954, -0.00030762702226638794, -0.00029456615447998047, -0.000281505286693573, -0.00026844441890716553, -0.00025538355112075806, -0.00024232268333435059, -0.00022926181554794312, -0.00021620094776153564, -0.00020314007997512817, -0.0001900792121887207, -0.00017701834440231323, -0.00016395747661590576, -0.0001508966088294983, -0.00013783574104309082, -0.00012477487325668335, -0.00011171400547027588, -9.865313768386841e-05, -8.559226989746094e-05, -7.253140211105347e-05, -5.9470534324645996e-05, -4.6409666538238525e-05, -3.3348798751831055e-05, -2.0287930965423584e-05, -7.227063179016113e-06, 5.833804607391357e-06, 1.8894672393798828e-05, 3.19555401802063e-05, 4.501640796661377e-05, 5.807727575302124e-05, 7.113814353942871e-05, 8.419901132583618e-05, 9.725987911224365e-05, 0.00011032074689865112, 0.0001233816146850586, 0.00013644248247146606, 0.00014950335025787354, 0.000162564218044281, 0.00017562508583068848, 0.00018868595361709595, 0.00020174682140350342, 0.0002148076891899109, 0.00022786855697631836, 0.00024092942476272583, 0.0002539902925491333, 0.00026705116033554077, 0.00028011202812194824, 0.0002931728959083557, 0.0003062337636947632, 0.00031929463148117065, 0.0003323554992675781]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 13.0, 14.0, 14.0, 30.0, 52.0, 79.0, 92.0, 160.0, 215.0, 354.0, 544.0, 766.0, 1192.0, 1808.0, 2924.0, 4550.0, 7190.0, 11440.0, 17748.0, 27551.0, 41517.0, 60367.0, 83916.0, 107285.0, 124562.0, 127615.0, 116803.0, 95481.0, 71248.0, 49642.0, 33045.0, 21815.0, 13912.0, 8869.0, 5549.0, 3655.0, 2350.0, 1423.0, 967.0, 614.0, 428.0, 235.0, 182.0, 113.0, 83.0, 53.0, 33.0, 16.0, 14.0, 13.0, 5.0, 6.0, 1.0, 1.0, 1.0, 3.0], "bins": [-6.96484375, -6.7552490234375, -6.545654296875, -6.3360595703125, -6.12646484375, -5.9168701171875, -5.707275390625, -5.4976806640625, -5.2880859375, -5.0784912109375, -4.868896484375, -4.6593017578125, -4.44970703125, -4.2401123046875, -4.030517578125, -3.8209228515625, -3.611328125, -3.4017333984375, -3.192138671875, -2.9825439453125, -2.77294921875, -2.5633544921875, -2.353759765625, -2.1441650390625, -1.9345703125, -1.7249755859375, -1.515380859375, -1.3057861328125, -1.09619140625, -0.8865966796875, -0.677001953125, -0.4674072265625, -0.2578125, -0.0482177734375, 0.161376953125, 0.3709716796875, 0.58056640625, 0.7901611328125, 0.999755859375, 1.2093505859375, 1.4189453125, 1.6285400390625, 1.838134765625, 2.0477294921875, 2.25732421875, 2.4669189453125, 2.676513671875, 2.8861083984375, 3.095703125, 3.3052978515625, 3.514892578125, 3.7244873046875, 3.93408203125, 4.1436767578125, 4.353271484375, 4.5628662109375, 4.7724609375, 4.9820556640625, 5.191650390625, 5.4012451171875, 5.61083984375, 5.8204345703125, 6.030029296875, 6.2396240234375, 6.44921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 8.0, 5.0, 7.0, 10.0, 11.0, 13.0, 8.0, 20.0, 17.0, 21.0, 29.0, 35.0, 50.0, 48.0, 46.0, 43.0, 53.0, 60.0, 51.0, 63.0, 48.0, 48.0, 39.0, 39.0, 51.0, 30.0, 37.0, 24.0, 21.0, 15.0, 7.0, 11.0, 6.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.998046875, -2.90325927734375, -2.8084716796875, -2.71368408203125, -2.618896484375, -2.52410888671875, -2.4293212890625, -2.33453369140625, -2.23974609375, -2.14495849609375, -2.0501708984375, -1.95538330078125, -1.860595703125, -1.76580810546875, -1.6710205078125, -1.57623291015625, -1.4814453125, -1.38665771484375, -1.2918701171875, -1.19708251953125, -1.102294921875, -1.00750732421875, -0.9127197265625, -0.81793212890625, -0.72314453125, -0.62835693359375, -0.5335693359375, -0.43878173828125, -0.343994140625, -0.24920654296875, -0.1544189453125, -0.05963134765625, 0.03515625, 0.12994384765625, 0.2247314453125, 0.31951904296875, 0.414306640625, 0.50909423828125, 0.6038818359375, 0.69866943359375, 0.79345703125, 0.88824462890625, 0.9830322265625, 1.07781982421875, 1.172607421875, 1.26739501953125, 1.3621826171875, 1.45697021484375, 1.5517578125, 1.64654541015625, 1.7413330078125, 1.83612060546875, 1.930908203125, 2.02569580078125, 2.1204833984375, 2.21527099609375, 2.31005859375, 2.40484619140625, 2.4996337890625, 2.59442138671875, 2.689208984375, 2.78399658203125, 2.8787841796875, 2.97357177734375, 3.068359375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 4.0, 10.0, 9.0, 12.0, 21.0, 21.0, 37.0, 27.0, 39.0, 24.0, 31.0, 44.0, 47.0, 54.0, 49.0, 45.0, 52.0, 53.0, 53.0, 51.0, 44.0, 51.0, 33.0, 26.0, 23.0, 21.0, 17.0, 27.0, 26.0, 12.0, 15.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15675163269043, -19.442813873291016, -18.728878021240234, -18.01494026184082, -17.301002502441406, -16.587064743041992, -15.873127937316895, -15.159191131591797, -14.445253372192383, -13.731315612792969, -13.017378807067871, -12.303442001342773, -11.58950424194336, -10.875566482543945, -10.161629676818848, -9.44769287109375, -8.733755111694336, -8.019817352294922, -7.305880546569824, -6.591943264007568, -5.8780059814453125, -5.164068698883057, -4.450131416320801, -3.736194133758545, -3.022256851196289, -2.308319568634033, -1.5943822860717773, -0.8804450035095215, -0.16650772094726562, 0.5474295616149902, 1.261366844177246, 1.975304126739502, 2.6892433166503906, 3.4031805992126465, 4.117117881774902, 4.831055164337158, 5.544992446899414, 6.25892972946167, 6.972867012023926, 7.686804294586182, 8.400741577148438, 9.114679336547852, 9.82861614227295, 10.542552947998047, 11.256490707397461, 11.970428466796875, 12.684365272521973, 13.39830207824707, 14.112239837646484, 14.826177597045898, 15.540114402770996, 16.254051208496094, 16.967988967895508, 17.681926727294922, 18.395862579345703, 19.109800338745117, 19.82373809814453, 20.537675857543945, 21.25161361694336, 21.96554946899414, 22.679487228393555, 23.39342498779297, 24.10736083984375, 24.821298599243164, 25.535236358642578]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 1.0, 3.0, 8.0, 13.0, 12.0, 11.0, 19.0, 16.0, 19.0, 27.0, 25.0, 25.0, 38.0, 35.0, 26.0, 42.0, 39.0, 44.0, 39.0, 49.0, 49.0, 45.0, 40.0, 34.0, 38.0, 45.0, 27.0, 30.0, 20.0, 26.0, 23.0, 21.0, 23.0, 18.0, 12.0, 17.0, 13.0, 9.0, 8.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.175724029541016, -17.55483055114746, -16.933937072753906, -16.313045501708984, -15.69215202331543, -15.071258544921875, -14.45036506652832, -13.829471588134766, -13.208579063415527, -12.587685585021973, -11.966793060302734, -11.34589958190918, -10.725006103515625, -10.104113578796387, -9.483220100402832, -8.862327575683594, -8.241434097290039, -7.620541095733643, -6.999648094177246, -6.378754615783691, -5.757861614227295, -5.136968612670898, -4.516075134277344, -3.8951821327209473, -3.274289131164551, -2.6533961296081543, -2.0325028896331787, -1.4116097688674927, -0.7907166481018066, -0.16982364654541016, 0.45106959342956543, 1.071962833404541, 1.6928539276123047, 2.313746929168701, 2.9346401691436768, 3.5555334091186523, 4.176426410675049, 4.797319412231445, 5.418212890625, 6.0391058921813965, 6.659998893737793, 7.2808918952941895, 7.901784896850586, 8.52267837524414, 9.143571853637695, 9.764464378356934, 10.385357856750488, 11.006250381469727, 11.627143859863281, 12.248037338256836, 12.868929862976074, 13.489823341369629, 14.110715866088867, 14.731609344482422, 15.352502822875977, 15.973396301269531, 16.594287872314453, 17.215181350708008, 17.836074829101562, 18.456966400146484, 19.07785987854004, 19.698753356933594, 20.31964683532715, 20.940540313720703, 21.561433792114258]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 6.0, 8.0, 12.0, 16.0, 24.0, 52.0, 61.0, 91.0, 138.0, 251.0, 346.0, 590.0, 906.0, 1479.0, 2362.0, 3617.0, 5746.0, 8909.0, 13522.0, 20726.0, 30548.0, 42404.0, 58020.0, 74451.0, 90422.0, 102069.0, 107495.0, 104884.0, 94055.0, 78497.0, 62061.0, 46027.0, 33000.0, 22880.0, 15333.0, 9984.0, 6383.0, 4085.0, 2637.0, 1618.0, 1054.0, 665.0, 405.0, 263.0, 160.0, 101.0, 63.0, 48.0, 32.0, 17.0, 18.0, 5.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.3984375, -11.0262451171875, -10.654052734375, -10.2818603515625, -9.90966796875, -9.5374755859375, -9.165283203125, -8.7930908203125, -8.4208984375, -8.0487060546875, -7.676513671875, -7.3043212890625, -6.93212890625, -6.5599365234375, -6.187744140625, -5.8155517578125, -5.443359375, -5.0711669921875, -4.698974609375, -4.3267822265625, -3.95458984375, -3.5823974609375, -3.210205078125, -2.8380126953125, -2.4658203125, -2.0936279296875, -1.721435546875, -1.3492431640625, -0.97705078125, -0.6048583984375, -0.232666015625, 0.1395263671875, 0.51171875, 0.8839111328125, 1.256103515625, 1.6282958984375, 2.00048828125, 2.3726806640625, 2.744873046875, 3.1170654296875, 3.4892578125, 3.8614501953125, 4.233642578125, 4.6058349609375, 4.97802734375, 5.3502197265625, 5.722412109375, 6.0946044921875, 6.466796875, 6.8389892578125, 7.211181640625, 7.5833740234375, 7.95556640625, 8.3277587890625, 8.699951171875, 9.0721435546875, 9.4443359375, 9.8165283203125, 10.188720703125, 10.5609130859375, 10.93310546875, 11.3052978515625, 11.677490234375, 12.0496826171875, 12.421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 4.0, 11.0, 19.0, 9.0, 23.0, 27.0, 18.0, 29.0, 36.0, 29.0, 36.0, 34.0, 42.0, 45.0, 35.0, 41.0, 44.0, 56.0, 50.0, 36.0, 52.0, 40.0, 41.0, 29.0, 34.0, 34.0, 28.0, 20.0, 8.0, 17.0, 21.0, 14.0, 7.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.836669921875, -18.14208984375, -17.447509765625, -16.7529296875, -16.058349609375, -15.36376953125, -14.669189453125, -13.974609375, -13.280029296875, -12.58544921875, -11.890869140625, -11.1962890625, -10.501708984375, -9.80712890625, -9.112548828125, -8.41796875, -7.723388671875, -7.02880859375, -6.334228515625, -5.6396484375, -4.945068359375, -4.25048828125, -3.555908203125, -2.861328125, -2.166748046875, -1.47216796875, -0.777587890625, -0.0830078125, 0.611572265625, 1.30615234375, 2.000732421875, 2.6953125, 3.389892578125, 4.08447265625, 4.779052734375, 5.4736328125, 6.168212890625, 6.86279296875, 7.557373046875, 8.251953125, 8.946533203125, 9.64111328125, 10.335693359375, 11.0302734375, 11.724853515625, 12.41943359375, 13.114013671875, 13.80859375, 14.503173828125, 15.19775390625, 15.892333984375, 16.5869140625, 17.281494140625, 17.97607421875, 18.670654296875, 19.365234375, 20.059814453125, 20.75439453125, 21.448974609375, 22.1435546875, 22.838134765625, 23.53271484375, 24.227294921875, 24.921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 8.0, 10.0, 18.0, 35.0, 70.0, 72.0, 116.0, 235.0, 351.0, 467.0, 805.0, 1270.0, 2030.0, 3087.0, 4705.0, 7160.0, 11480.0, 17361.0, 26060.0, 37469.0, 52682.0, 69850.0, 87747.0, 102608.0, 110087.0, 109776.0, 99985.0, 84010.0, 66037.0, 49234.0, 34756.0, 23758.0, 16018.0, 10478.0, 6789.0, 4206.0, 2684.0, 1795.0, 1164.0, 726.0, 493.0, 313.0, 194.0, 126.0, 72.0, 55.0, 31.0, 27.0, 12.0, 11.0, 7.0, 6.0, 4.0, 3.0, 3.0], "bins": [-13.6953125, -13.291259765625, -12.88720703125, -12.483154296875, -12.0791015625, -11.675048828125, -11.27099609375, -10.866943359375, -10.462890625, -10.058837890625, -9.65478515625, -9.250732421875, -8.8466796875, -8.442626953125, -8.03857421875, -7.634521484375, -7.23046875, -6.826416015625, -6.42236328125, -6.018310546875, -5.6142578125, -5.210205078125, -4.80615234375, -4.402099609375, -3.998046875, -3.593994140625, -3.18994140625, -2.785888671875, -2.3818359375, -1.977783203125, -1.57373046875, -1.169677734375, -0.765625, -0.361572265625, 0.04248046875, 0.446533203125, 0.8505859375, 1.254638671875, 1.65869140625, 2.062744140625, 2.466796875, 2.870849609375, 3.27490234375, 3.678955078125, 4.0830078125, 4.487060546875, 4.89111328125, 5.295166015625, 5.69921875, 6.103271484375, 6.50732421875, 6.911376953125, 7.3154296875, 7.719482421875, 8.12353515625, 8.527587890625, 8.931640625, 9.335693359375, 9.73974609375, 10.143798828125, 10.5478515625, 10.951904296875, 11.35595703125, 11.760009765625, 12.1640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 2.0, 6.0, 7.0, 10.0, 8.0, 20.0, 8.0, 16.0, 13.0, 20.0, 26.0, 24.0, 36.0, 19.0, 35.0, 38.0, 24.0, 37.0, 30.0, 35.0, 50.0, 46.0, 41.0, 48.0, 39.0, 43.0, 34.0, 31.0, 42.0, 33.0, 34.0, 17.0, 24.0, 13.0, 14.0, 14.0, 8.0, 12.0, 8.0, 10.0, 11.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-12.6796875, -12.296142578125, -11.91259765625, -11.529052734375, -11.1455078125, -10.761962890625, -10.37841796875, -9.994873046875, -9.611328125, -9.227783203125, -8.84423828125, -8.460693359375, -8.0771484375, -7.693603515625, -7.31005859375, -6.926513671875, -6.54296875, -6.159423828125, -5.77587890625, -5.392333984375, -5.0087890625, -4.625244140625, -4.24169921875, -3.858154296875, -3.474609375, -3.091064453125, -2.70751953125, -2.323974609375, -1.9404296875, -1.556884765625, -1.17333984375, -0.789794921875, -0.40625, -0.022705078125, 0.36083984375, 0.744384765625, 1.1279296875, 1.511474609375, 1.89501953125, 2.278564453125, 2.662109375, 3.045654296875, 3.42919921875, 3.812744140625, 4.1962890625, 4.579833984375, 4.96337890625, 5.346923828125, 5.73046875, 6.114013671875, 6.49755859375, 6.881103515625, 7.2646484375, 7.648193359375, 8.03173828125, 8.415283203125, 8.798828125, 9.182373046875, 9.56591796875, 9.949462890625, 10.3330078125, 10.716552734375, 11.10009765625, 11.483642578125, 11.8671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 13.0, 34.0, 39.0, 76.0, 101.0, 154.0, 266.0, 420.0, 672.0, 1039.0, 1728.0, 2711.0, 4305.0, 6800.0, 10900.0, 17019.0, 25818.0, 38347.0, 54479.0, 73463.0, 92835.0, 108410.0, 115567.0, 113601.0, 100482.0, 82255.0, 63117.0, 45733.0, 30875.0, 20802.0, 13420.0, 8683.0, 5537.0, 3328.0, 2071.0, 1292.0, 837.0, 462.0, 327.0, 195.0, 123.0, 78.0, 54.0, 30.0, 19.0, 22.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.71484375, -4.57080078125, -4.4267578125, -4.28271484375, -4.138671875, -3.99462890625, -3.8505859375, -3.70654296875, -3.5625, -3.41845703125, -3.2744140625, -3.13037109375, -2.986328125, -2.84228515625, -2.6982421875, -2.55419921875, -2.41015625, -2.26611328125, -2.1220703125, -1.97802734375, -1.833984375, -1.68994140625, -1.5458984375, -1.40185546875, -1.2578125, -1.11376953125, -0.9697265625, -0.82568359375, -0.681640625, -0.53759765625, -0.3935546875, -0.24951171875, -0.10546875, 0.03857421875, 0.1826171875, 0.32666015625, 0.470703125, 0.61474609375, 0.7587890625, 0.90283203125, 1.046875, 1.19091796875, 1.3349609375, 1.47900390625, 1.623046875, 1.76708984375, 1.9111328125, 2.05517578125, 2.19921875, 2.34326171875, 2.4873046875, 2.63134765625, 2.775390625, 2.91943359375, 3.0634765625, 3.20751953125, 3.3515625, 3.49560546875, 3.6396484375, 3.78369140625, 3.927734375, 4.07177734375, 4.2158203125, 4.35986328125, 4.50390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 9.0, 3.0, 5.0, 14.0, 9.0, 15.0, 12.0, 20.0, 17.0, 27.0, 26.0, 30.0, 33.0, 46.0, 32.0, 59.0, 43.0, 59.0, 46.0, 50.0, 50.0, 47.0, 33.0, 46.0, 33.0, 31.0, 36.0, 30.0, 26.0, 19.0, 18.0, 19.0, 9.0, 10.0, 8.0, 2.0, 6.0, 4.0, 0.0, 1.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006513595581054688, -0.0006326362490653992, -0.0006139129400253296, -0.00059518963098526, -0.0005764663219451904, -0.0005577430129051208, -0.0005390197038650513, -0.0005202963948249817, -0.0005015730857849121, -0.00048284977674484253, -0.00046412646770477295, -0.00044540315866470337, -0.0004266798496246338, -0.0004079565405845642, -0.00038923323154449463, -0.00037050992250442505, -0.00035178661346435547, -0.0003330633044242859, -0.0003143399953842163, -0.00029561668634414673, -0.00027689337730407715, -0.00025817006826400757, -0.000239446759223938, -0.0002207234501838684, -0.00020200014114379883, -0.00018327683210372925, -0.00016455352306365967, -0.0001458302140235901, -0.0001271069049835205, -0.00010838359594345093, -8.966028690338135e-05, -7.093697786331177e-05, -5.221366882324219e-05, -3.349035978317261e-05, -1.4767050743103027e-05, 3.956258296966553e-06, 2.2679567337036133e-05, 4.140287637710571e-05, 6.012618541717529e-05, 7.884949445724487e-05, 9.757280349731445e-05, 0.00011629611253738403, 0.0001350194215774536, 0.0001537427306175232, 0.00017246603965759277, 0.00019118934869766235, 0.00020991265773773193, 0.00022863596677780151, 0.0002473592758178711, 0.0002660825848579407, 0.00028480589389801025, 0.00030352920293807983, 0.0003222525119781494, 0.000340975821018219, 0.0003596991300582886, 0.00037842243909835815, 0.00039714574813842773, 0.0004158690571784973, 0.0004345923662185669, 0.0004533156752586365, 0.00047203898429870605, 0.0004907622933387756, 0.0005094856023788452, 0.0005282089114189148, 0.0005469322204589844]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 15.0, 16.0, 43.0, 66.0, 69.0, 136.0, 184.0, 297.0, 428.0, 637.0, 974.0, 1552.0, 2324.0, 3375.0, 5107.0, 7508.0, 11014.0, 15795.0, 22678.0, 31452.0, 42251.0, 55128.0, 69354.0, 82251.0, 92109.0, 97585.0, 95765.0, 89448.0, 77447.0, 64147.0, 49945.0, 38477.0, 27752.0, 20023.0, 13884.0, 9604.0, 6541.0, 4478.0, 2963.0, 1952.0, 1266.0, 872.0, 567.0, 363.0, 261.0, 163.0, 99.0, 66.0, 44.0, 28.0, 15.0, 20.0, 6.0, 4.0, 5.0], "bins": [-4.4296875, -4.302459716796875, -4.17523193359375, -4.048004150390625, -3.9207763671875, -3.793548583984375, -3.66632080078125, -3.539093017578125, -3.411865234375, -3.284637451171875, -3.15740966796875, -3.030181884765625, -2.9029541015625, -2.775726318359375, -2.64849853515625, -2.521270751953125, -2.39404296875, -2.266815185546875, -2.13958740234375, -2.012359619140625, -1.8851318359375, -1.757904052734375, -1.63067626953125, -1.503448486328125, -1.376220703125, -1.248992919921875, -1.12176513671875, -0.994537353515625, -0.8673095703125, -0.740081787109375, -0.61285400390625, -0.485626220703125, -0.3583984375, -0.231170654296875, -0.10394287109375, 0.023284912109375, 0.1505126953125, 0.277740478515625, 0.40496826171875, 0.532196044921875, 0.659423828125, 0.786651611328125, 0.91387939453125, 1.041107177734375, 1.1683349609375, 1.295562744140625, 1.42279052734375, 1.550018310546875, 1.67724609375, 1.804473876953125, 1.93170166015625, 2.058929443359375, 2.1861572265625, 2.313385009765625, 2.44061279296875, 2.567840576171875, 2.695068359375, 2.822296142578125, 2.94952392578125, 3.076751708984375, 3.2039794921875, 3.331207275390625, 3.45843505859375, 3.585662841796875, 3.712890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 0.0, 2.0, 4.0, 6.0, 5.0, 11.0, 10.0, 9.0, 14.0, 14.0, 26.0, 24.0, 19.0, 38.0, 30.0, 37.0, 32.0, 30.0, 38.0, 46.0, 39.0, 45.0, 48.0, 39.0, 47.0, 37.0, 44.0, 26.0, 42.0, 28.0, 34.0, 26.0, 26.0, 16.0, 17.0, 15.0, 12.0, 13.0, 7.0, 13.0, 8.0, 7.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.001953125, -1.94000244140625, -1.8780517578125, -1.81610107421875, -1.754150390625, -1.69219970703125, -1.6302490234375, -1.56829833984375, -1.50634765625, -1.44439697265625, -1.3824462890625, -1.32049560546875, -1.258544921875, -1.19659423828125, -1.1346435546875, -1.07269287109375, -1.0107421875, -0.94879150390625, -0.8868408203125, -0.82489013671875, -0.762939453125, -0.70098876953125, -0.6390380859375, -0.57708740234375, -0.51513671875, -0.45318603515625, -0.3912353515625, -0.32928466796875, -0.267333984375, -0.20538330078125, -0.1434326171875, -0.08148193359375, -0.01953125, 0.04241943359375, 0.1043701171875, 0.16632080078125, 0.228271484375, 0.29022216796875, 0.3521728515625, 0.41412353515625, 0.47607421875, 0.53802490234375, 0.5999755859375, 0.66192626953125, 0.723876953125, 0.78582763671875, 0.8477783203125, 0.90972900390625, 0.9716796875, 1.03363037109375, 1.0955810546875, 1.15753173828125, 1.219482421875, 1.28143310546875, 1.3433837890625, 1.40533447265625, 1.46728515625, 1.52923583984375, 1.5911865234375, 1.65313720703125, 1.715087890625, 1.77703857421875, 1.8389892578125, 1.90093994140625, 1.962890625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 8.0, 12.0, 15.0, 19.0, 32.0, 28.0, 26.0, 33.0, 31.0, 26.0, 38.0, 44.0, 48.0, 46.0, 52.0, 42.0, 61.0, 46.0, 45.0, 52.0, 35.0, 36.0, 31.0, 29.0, 29.0, 26.0, 27.0, 9.0, 20.0, 16.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.49630355834961, -18.811979293823242, -18.127655029296875, -17.443328857421875, -16.759004592895508, -16.07468032836914, -15.390355110168457, -14.706029891967773, -14.021705627441406, -13.337381362915039, -12.653056144714355, -11.968730926513672, -11.284406661987305, -10.600082397460938, -9.915757179260254, -9.23143196105957, -8.547107696533203, -7.862782955169678, -7.178458213806152, -6.494133472442627, -5.809808731079102, -5.125483989715576, -4.441159248352051, -3.7568345069885254, -3.072509765625, -2.3881850242614746, -1.7038602828979492, -1.0195355415344238, -0.33521080017089844, 0.34911394119262695, 1.0334386825561523, 1.7177634239196777, 2.402090072631836, 3.0864148139953613, 3.7707395553588867, 4.455064296722412, 5.1393890380859375, 5.823713779449463, 6.508038520812988, 7.192363262176514, 7.876688003540039, 8.561012268066406, 9.24533748626709, 9.929662704467773, 10.61398696899414, 11.298311233520508, 11.982636451721191, 12.666961669921875, 13.351285934448242, 14.03561019897461, 14.719935417175293, 15.404260635375977, 16.088584899902344, 16.77290916442871, 17.457233428955078, 18.141559600830078, 18.825883865356445, 19.510208129882812, 20.194534301757812, 20.87885856628418, 21.563182830810547, 22.247507095336914, 22.93183135986328, 23.61615753173828, 24.30048179626465]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 12.0, 11.0, 7.0, 19.0, 17.0, 15.0, 22.0, 20.0, 19.0, 30.0, 25.0, 36.0, 39.0, 41.0, 38.0, 40.0, 39.0, 43.0, 42.0, 45.0, 36.0, 45.0, 33.0, 33.0, 36.0, 26.0, 38.0, 17.0, 23.0, 25.0, 20.0, 14.0, 18.0, 17.0, 14.0, 7.0, 8.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.404924392700195, -18.76725959777832, -18.129594802856445, -17.491928100585938, -16.854263305664062, -16.216598510742188, -15.578933715820312, -14.941268920898438, -14.303603172302246, -13.665938377380371, -13.02827262878418, -12.390607833862305, -11.75294303894043, -11.115277290344238, -10.477612495422363, -9.839946746826172, -9.202281951904297, -8.564617156982422, -7.9269514083862305, -7.2892866134643555, -6.651621341705322, -6.013956069946289, -5.376291275024414, -4.738626003265381, -4.100960731506348, -3.4632954597473145, -2.8256304264068604, -2.1879653930664062, -1.550300121307373, -0.9126348495483398, -0.27496981620788574, 0.36269521713256836, 1.0003585815429688, 1.6380237340927124, 2.275688886642456, 2.91335391998291, 3.5510191917419434, 4.188684463500977, 4.826349258422852, 5.464014530181885, 6.101679801940918, 6.739345073699951, 7.377010345458984, 8.01467514038086, 8.652339935302734, 9.290005683898926, 9.9276704788208, 10.565336227416992, 11.203001022338867, 11.840665817260742, 12.478331565856934, 13.115996360778809, 13.753662109375, 14.391326904296875, 15.02899169921875, 15.666656494140625, 16.3043212890625, 16.941986083984375, 17.57965087890625, 18.217317581176758, 18.854982376098633, 19.492647171020508, 20.130311965942383, 20.767976760864258, 21.405643463134766]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 9.0, 22.0, 29.0, 48.0, 49.0, 102.0, 143.0, 242.0, 375.0, 580.0, 934.0, 1360.0, 2137.0, 3470.0, 5717.0, 9620.0, 16175.0, 27708.0, 48613.0, 84915.0, 149224.0, 254459.0, 402727.0, 563536.0, 663521.0, 633712.0, 498406.0, 337504.0, 206370.0, 118650.0, 68271.0, 39046.0, 22877.0, 13205.0, 7970.0, 4795.0, 2943.0, 1714.0, 1068.0, 719.0, 450.0, 302.0, 196.0, 112.0, 84.0, 56.0, 39.0, 27.0, 8.0, 8.0, 11.0, 5.0, 4.0, 4.0], "bins": [-17.5, -16.9970703125, -16.494140625, -15.9912109375, -15.48828125, -14.9853515625, -14.482421875, -13.9794921875, -13.4765625, -12.9736328125, -12.470703125, -11.9677734375, -11.46484375, -10.9619140625, -10.458984375, -9.9560546875, -9.453125, -8.9501953125, -8.447265625, -7.9443359375, -7.44140625, -6.9384765625, -6.435546875, -5.9326171875, -5.4296875, -4.9267578125, -4.423828125, -3.9208984375, -3.41796875, -2.9150390625, -2.412109375, -1.9091796875, -1.40625, -0.9033203125, -0.400390625, 0.1025390625, 0.60546875, 1.1083984375, 1.611328125, 2.1142578125, 2.6171875, 3.1201171875, 3.623046875, 4.1259765625, 4.62890625, 5.1318359375, 5.634765625, 6.1376953125, 6.640625, 7.1435546875, 7.646484375, 8.1494140625, 8.65234375, 9.1552734375, 9.658203125, 10.1611328125, 10.6640625, 11.1669921875, 11.669921875, 12.1728515625, 12.67578125, 13.1787109375, 13.681640625, 14.1845703125, 14.6875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 14.0, 6.0, 9.0, 6.0, 13.0, 16.0, 19.0, 22.0, 19.0, 31.0, 22.0, 35.0, 25.0, 23.0, 34.0, 54.0, 43.0, 52.0, 38.0, 37.0, 40.0, 46.0, 40.0, 33.0, 33.0, 33.0, 35.0, 24.0, 32.0, 20.0, 15.0, 16.0, 24.0, 24.0, 12.0, 7.0, 8.0, 11.0, 8.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.125, -15.568603515625, -15.01220703125, -14.455810546875, -13.8994140625, -13.343017578125, -12.78662109375, -12.230224609375, -11.673828125, -11.117431640625, -10.56103515625, -10.004638671875, -9.4482421875, -8.891845703125, -8.33544921875, -7.779052734375, -7.22265625, -6.666259765625, -6.10986328125, -5.553466796875, -4.9970703125, -4.440673828125, -3.88427734375, -3.327880859375, -2.771484375, -2.215087890625, -1.65869140625, -1.102294921875, -0.5458984375, 0.010498046875, 0.56689453125, 1.123291015625, 1.6796875, 2.236083984375, 2.79248046875, 3.348876953125, 3.9052734375, 4.461669921875, 5.01806640625, 5.574462890625, 6.130859375, 6.687255859375, 7.24365234375, 7.800048828125, 8.3564453125, 8.912841796875, 9.46923828125, 10.025634765625, 10.58203125, 11.138427734375, 11.69482421875, 12.251220703125, 12.8076171875, 13.364013671875, 13.92041015625, 14.476806640625, 15.033203125, 15.589599609375, 16.14599609375, 16.702392578125, 17.2587890625, 17.815185546875, 18.37158203125, 18.927978515625, 19.484375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 3.0, 12.0, 17.0, 27.0, 49.0, 75.0, 130.0, 265.0, 378.0, 640.0, 1080.0, 1761.0, 3057.0, 5127.0, 8402.0, 14273.0, 24067.0, 40580.0, 68832.0, 115492.0, 190819.0, 301629.0, 440631.0, 569435.0, 625889.0, 568999.0, 438436.0, 300954.0, 190374.0, 115369.0, 68146.0, 40408.0, 23816.0, 14209.0, 8294.0, 4974.0, 2988.0, 1868.0, 1088.0, 659.0, 390.0, 269.0, 155.0, 93.0, 44.0, 41.0, 14.0, 12.0, 4.0, 1.0, 5.0, 3.0, 1.0], "bins": [-20.3125, -19.740234375, -19.16796875, -18.595703125, -18.0234375, -17.451171875, -16.87890625, -16.306640625, -15.734375, -15.162109375, -14.58984375, -14.017578125, -13.4453125, -12.873046875, -12.30078125, -11.728515625, -11.15625, -10.583984375, -10.01171875, -9.439453125, -8.8671875, -8.294921875, -7.72265625, -7.150390625, -6.578125, -6.005859375, -5.43359375, -4.861328125, -4.2890625, -3.716796875, -3.14453125, -2.572265625, -2.0, -1.427734375, -0.85546875, -0.283203125, 0.2890625, 0.861328125, 1.43359375, 2.005859375, 2.578125, 3.150390625, 3.72265625, 4.294921875, 4.8671875, 5.439453125, 6.01171875, 6.583984375, 7.15625, 7.728515625, 8.30078125, 8.873046875, 9.4453125, 10.017578125, 10.58984375, 11.162109375, 11.734375, 12.306640625, 12.87890625, 13.451171875, 14.0234375, 14.595703125, 15.16796875, 15.740234375, 16.3125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 12.0, 11.0, 10.0, 8.0, 19.0, 16.0, 31.0, 37.0, 41.0, 37.0, 37.0, 71.0, 87.0, 120.0, 115.0, 104.0, 134.0, 167.0, 165.0, 189.0, 190.0, 170.0, 201.0, 201.0, 200.0, 196.0, 204.0, 193.0, 166.0, 142.0, 118.0, 110.0, 108.0, 71.0, 62.0, 64.0, 49.0, 45.0, 29.0, 40.0, 26.0, 11.0, 17.0, 9.0, 9.0, 11.0, 7.0, 3.0, 3.0, 5.0, 2.0, 3.0], "bins": [-7.46875, -7.25555419921875, -7.0423583984375, -6.82916259765625, -6.615966796875, -6.40277099609375, -6.1895751953125, -5.97637939453125, -5.76318359375, -5.54998779296875, -5.3367919921875, -5.12359619140625, -4.910400390625, -4.69720458984375, -4.4840087890625, -4.27081298828125, -4.0576171875, -3.84442138671875, -3.6312255859375, -3.41802978515625, -3.204833984375, -2.99163818359375, -2.7784423828125, -2.56524658203125, -2.35205078125, -2.13885498046875, -1.9256591796875, -1.71246337890625, -1.499267578125, -1.28607177734375, -1.0728759765625, -0.85968017578125, -0.646484375, -0.43328857421875, -0.2200927734375, -0.00689697265625, 0.206298828125, 0.41949462890625, 0.6326904296875, 0.84588623046875, 1.05908203125, 1.27227783203125, 1.4854736328125, 1.69866943359375, 1.911865234375, 2.12506103515625, 2.3382568359375, 2.55145263671875, 2.7646484375, 2.97784423828125, 3.1910400390625, 3.40423583984375, 3.617431640625, 3.83062744140625, 4.0438232421875, 4.25701904296875, 4.47021484375, 4.68341064453125, 4.8966064453125, 5.10980224609375, 5.322998046875, 5.53619384765625, 5.7493896484375, 5.96258544921875, 6.17578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 10.0, 9.0, 16.0, 18.0, 17.0, 18.0, 22.0, 31.0, 43.0, 28.0, 39.0, 34.0, 44.0, 55.0, 64.0, 52.0, 41.0, 50.0, 49.0, 50.0, 46.0, 37.0, 32.0, 28.0, 33.0, 24.0, 20.0, 16.0, 11.0, 14.0, 9.0, 4.0, 7.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.23534393310547, -22.53009033203125, -21.82483673095703, -21.119583129882812, -20.41432762145996, -19.709074020385742, -19.003820419311523, -18.298566818237305, -17.593311309814453, -16.888057708740234, -16.182804107666016, -15.47754955291748, -14.772294998168945, -14.067041397094727, -13.361787796020508, -12.656534194946289, -11.95128059387207, -11.246026992797852, -10.540772438049316, -9.835518836975098, -9.130264282226562, -8.425010681152344, -7.719757080078125, -7.014503002166748, -6.309248924255371, -5.603994846343994, -4.898740768432617, -4.193487167358398, -3.4882330894470215, -2.7829790115356445, -2.077725410461426, -1.3724713325500488, -0.6672191619873047, 0.038034796714782715, 0.7432887554168701, 1.448542594909668, 2.153796672821045, 2.859050750732422, 3.5643043518066406, 4.269558429718018, 4.9748125076293945, 5.6800665855407715, 6.385320663452148, 7.090574264526367, 7.795828342437744, 8.501082420349121, 9.20633602142334, 9.911590576171875, 10.616844177246094, 11.322097778320312, 12.027352333068848, 12.732605934143066, 13.437860488891602, 14.14311408996582, 14.848367691040039, 15.553621292114258, 16.25887680053711, 16.964130401611328, 17.669384002685547, 18.374637603759766, 19.079893112182617, 19.785146713256836, 20.490400314331055, 21.195653915405273, 21.900907516479492]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 9.0, 6.0, 7.0, 9.0, 10.0, 15.0, 15.0, 17.0, 21.0, 29.0, 26.0, 28.0, 37.0, 29.0, 46.0, 42.0, 34.0, 47.0, 42.0, 36.0, 36.0, 41.0, 36.0, 41.0, 34.0, 35.0, 40.0, 33.0, 29.0, 14.0, 23.0, 12.0, 16.0, 19.0, 10.0, 16.0, 17.0, 8.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.522321701049805, -16.929426193237305, -16.336528778076172, -15.743633270263672, -15.150737762451172, -14.557841300964355, -13.964944839477539, -13.372049331665039, -12.779152870178223, -12.186256408691406, -11.593360900878906, -11.00046443939209, -10.407567977905273, -9.814672470092773, -9.221776008605957, -8.62887954711914, -8.03598403930664, -7.443088054656982, -6.850192070007324, -6.257295608520508, -5.66439962387085, -5.071503639221191, -4.478607177734375, -3.885711193084717, -3.2928152084350586, -2.6999192237854004, -2.107023000717163, -1.5141268968582153, -0.9212307929992676, -0.3283348083496094, 0.26456141471862793, 0.8574576377868652, 1.4503555297851562, 2.0432515144348145, 2.6361477375030518, 3.229043960571289, 3.8219399452209473, 4.4148359298706055, 5.007732391357422, 5.60062837600708, 6.193524360656738, 6.7864203453063965, 7.379316329956055, 7.972212791442871, 8.565109252929688, 9.158004760742188, 9.750901222229004, 10.34379768371582, 10.93669319152832, 11.529589653015137, 12.122485160827637, 12.715381622314453, 13.308277130126953, 13.90117359161377, 14.494070053100586, 15.086965560913086, 15.679862022399902, 16.27275848388672, 16.86565399169922, 17.45854949951172, 18.05144691467285, 18.64434242248535, 19.23723793029785, 19.830135345458984, 20.423030853271484]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 22.0, 28.0, 54.0, 79.0, 133.0, 246.0, 484.0, 756.0, 1511.0, 2634.0, 4838.0, 8799.0, 15653.0, 27235.0, 45227.0, 72365.0, 104643.0, 134951.0, 150277.0, 143370.0, 117483.0, 84722.0, 55192.0, 33924.0, 19122.0, 11073.0, 6163.0, 3333.0, 1818.0, 1048.0, 565.0, 330.0, 174.0, 111.0, 74.0, 32.0, 23.0, 18.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.939208984375, -11.55029296875, -11.161376953125, -10.7724609375, -10.383544921875, -9.99462890625, -9.605712890625, -9.216796875, -8.827880859375, -8.43896484375, -8.050048828125, -7.6611328125, -7.272216796875, -6.88330078125, -6.494384765625, -6.10546875, -5.716552734375, -5.32763671875, -4.938720703125, -4.5498046875, -4.160888671875, -3.77197265625, -3.383056640625, -2.994140625, -2.605224609375, -2.21630859375, -1.827392578125, -1.4384765625, -1.049560546875, -0.66064453125, -0.271728515625, 0.1171875, 0.506103515625, 0.89501953125, 1.283935546875, 1.6728515625, 2.061767578125, 2.45068359375, 2.839599609375, 3.228515625, 3.617431640625, 4.00634765625, 4.395263671875, 4.7841796875, 5.173095703125, 5.56201171875, 5.950927734375, 6.33984375, 6.728759765625, 7.11767578125, 7.506591796875, 7.8955078125, 8.284423828125, 8.67333984375, 9.062255859375, 9.451171875, 9.840087890625, 10.22900390625, 10.617919921875, 11.0068359375, 11.395751953125, 11.78466796875, 12.173583984375, 12.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 6.0, 6.0, 7.0, 4.0, 12.0, 10.0, 15.0, 9.0, 17.0, 22.0, 25.0, 25.0, 30.0, 23.0, 35.0, 42.0, 45.0, 33.0, 40.0, 37.0, 43.0, 40.0, 45.0, 47.0, 31.0, 27.0, 38.0, 33.0, 34.0, 30.0, 27.0, 28.0, 18.0, 15.0, 11.0, 14.0, 14.0, 13.0, 12.0, 10.0, 6.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.439697265625, -15.83251953125, -15.225341796875, -14.6181640625, -14.010986328125, -13.40380859375, -12.796630859375, -12.189453125, -11.582275390625, -10.97509765625, -10.367919921875, -9.7607421875, -9.153564453125, -8.54638671875, -7.939208984375, -7.33203125, -6.724853515625, -6.11767578125, -5.510498046875, -4.9033203125, -4.296142578125, -3.68896484375, -3.081787109375, -2.474609375, -1.867431640625, -1.26025390625, -0.653076171875, -0.0458984375, 0.561279296875, 1.16845703125, 1.775634765625, 2.3828125, 2.989990234375, 3.59716796875, 4.204345703125, 4.8115234375, 5.418701171875, 6.02587890625, 6.633056640625, 7.240234375, 7.847412109375, 8.45458984375, 9.061767578125, 9.6689453125, 10.276123046875, 10.88330078125, 11.490478515625, 12.09765625, 12.704833984375, 13.31201171875, 13.919189453125, 14.5263671875, 15.133544921875, 15.74072265625, 16.347900390625, 16.955078125, 17.562255859375, 18.16943359375, 18.776611328125, 19.3837890625, 19.990966796875, 20.59814453125, 21.205322265625, 21.8125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 16.0, 28.0, 37.0, 52.0, 81.0, 135.0, 188.0, 282.0, 466.0, 646.0, 1130.0, 1863.0, 2970.0, 5122.0, 8502.0, 14723.0, 25482.0, 42466.0, 69447.0, 107016.0, 146469.0, 166748.0, 151508.0, 114133.0, 75065.0, 47028.0, 27489.0, 16180.0, 9380.0, 5563.0, 3181.0, 2027.0, 1132.0, 690.0, 456.0, 276.0, 190.0, 120.0, 76.0, 54.0, 42.0, 29.0, 17.0, 12.0, 17.0, 6.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0], "bins": [-16.5, -16.0086669921875, -15.517333984375, -15.0260009765625, -14.53466796875, -14.0433349609375, -13.552001953125, -13.0606689453125, -12.5693359375, -12.0780029296875, -11.586669921875, -11.0953369140625, -10.60400390625, -10.1126708984375, -9.621337890625, -9.1300048828125, -8.638671875, -8.1473388671875, -7.656005859375, -7.1646728515625, -6.67333984375, -6.1820068359375, -5.690673828125, -5.1993408203125, -4.7080078125, -4.2166748046875, -3.725341796875, -3.2340087890625, -2.74267578125, -2.2513427734375, -1.760009765625, -1.2686767578125, -0.77734375, -0.2860107421875, 0.205322265625, 0.6966552734375, 1.18798828125, 1.6793212890625, 2.170654296875, 2.6619873046875, 3.1533203125, 3.6446533203125, 4.135986328125, 4.6273193359375, 5.11865234375, 5.6099853515625, 6.101318359375, 6.5926513671875, 7.083984375, 7.5753173828125, 8.066650390625, 8.5579833984375, 9.04931640625, 9.5406494140625, 10.031982421875, 10.5233154296875, 11.0146484375, 11.5059814453125, 11.997314453125, 12.4886474609375, 12.97998046875, 13.4713134765625, 13.962646484375, 14.4539794921875, 14.9453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 6.0, 6.0, 5.0, 4.0, 11.0, 13.0, 14.0, 16.0, 24.0, 18.0, 17.0, 30.0, 35.0, 28.0, 35.0, 31.0, 38.0, 28.0, 48.0, 44.0, 45.0, 31.0, 38.0, 37.0, 45.0, 41.0, 38.0, 34.0, 31.0, 29.0, 26.0, 21.0, 24.0, 19.0, 14.0, 12.0, 4.0, 14.0, 6.0, 8.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0], "bins": [-14.0546875, -13.669921875, -13.28515625, -12.900390625, -12.515625, -12.130859375, -11.74609375, -11.361328125, -10.9765625, -10.591796875, -10.20703125, -9.822265625, -9.4375, -9.052734375, -8.66796875, -8.283203125, -7.8984375, -7.513671875, -7.12890625, -6.744140625, -6.359375, -5.974609375, -5.58984375, -5.205078125, -4.8203125, -4.435546875, -4.05078125, -3.666015625, -3.28125, -2.896484375, -2.51171875, -2.126953125, -1.7421875, -1.357421875, -0.97265625, -0.587890625, -0.203125, 0.181640625, 0.56640625, 0.951171875, 1.3359375, 1.720703125, 2.10546875, 2.490234375, 2.875, 3.259765625, 3.64453125, 4.029296875, 4.4140625, 4.798828125, 5.18359375, 5.568359375, 5.953125, 6.337890625, 6.72265625, 7.107421875, 7.4921875, 7.876953125, 8.26171875, 8.646484375, 9.03125, 9.416015625, 9.80078125, 10.185546875, 10.5703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 9.0, 21.0, 35.0, 42.0, 55.0, 94.0, 153.0, 264.0, 434.0, 709.0, 1224.0, 2132.0, 3802.0, 7023.0, 12474.0, 23085.0, 41969.0, 76966.0, 130251.0, 184257.0, 197246.0, 152361.0, 95382.0, 53789.0, 29130.0, 15839.0, 8549.0, 4789.0, 2686.0, 1552.0, 868.0, 554.0, 309.0, 173.0, 108.0, 70.0, 54.0, 36.0, 19.0, 15.0, 5.0, 8.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5, -8.2359619140625, -7.971923828125, -7.7078857421875, -7.44384765625, -7.1798095703125, -6.915771484375, -6.6517333984375, -6.3876953125, -6.1236572265625, -5.859619140625, -5.5955810546875, -5.33154296875, -5.0675048828125, -4.803466796875, -4.5394287109375, -4.275390625, -4.0113525390625, -3.747314453125, -3.4832763671875, -3.21923828125, -2.9552001953125, -2.691162109375, -2.4271240234375, -2.1630859375, -1.8990478515625, -1.635009765625, -1.3709716796875, -1.10693359375, -0.8428955078125, -0.578857421875, -0.3148193359375, -0.05078125, 0.2132568359375, 0.477294921875, 0.7413330078125, 1.00537109375, 1.2694091796875, 1.533447265625, 1.7974853515625, 2.0615234375, 2.3255615234375, 2.589599609375, 2.8536376953125, 3.11767578125, 3.3817138671875, 3.645751953125, 3.9097900390625, 4.173828125, 4.4378662109375, 4.701904296875, 4.9659423828125, 5.22998046875, 5.4940185546875, 5.758056640625, 6.0220947265625, 6.2861328125, 6.5501708984375, 6.814208984375, 7.0782470703125, 7.34228515625, 7.6063232421875, 7.870361328125, 8.1343994140625, 8.3984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 6.0, 11.0, 11.0, 21.0, 22.0, 23.0, 31.0, 34.0, 25.0, 46.0, 48.0, 44.0, 52.0, 47.0, 66.0, 50.0, 58.0, 60.0, 55.0, 52.0, 58.0, 27.0, 28.0, 19.0, 17.0, 20.0, 9.0, 6.0, 13.0, 4.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0005269050598144531, -0.0005116760730743408, -0.0004964470863342285, -0.0004812180995941162, -0.0004659891128540039, -0.0004507601261138916, -0.0004355311393737793, -0.000420302152633667, -0.0004050731658935547, -0.0003898441791534424, -0.0003746151924133301, -0.0003593862056732178, -0.00034415721893310547, -0.00032892823219299316, -0.00031369924545288086, -0.00029847025871276855, -0.00028324127197265625, -0.00026801228523254395, -0.00025278329849243164, -0.00023755431175231934, -0.00022232532501220703, -0.00020709633827209473, -0.00019186735153198242, -0.00017663836479187012, -0.0001614093780517578, -0.0001461803913116455, -0.0001309514045715332, -0.0001157224178314209, -0.0001004934310913086, -8.526444435119629e-05, -7.003545761108398e-05, -5.480647087097168e-05, -3.9577484130859375e-05, -2.434849739074707e-05, -9.119510650634766e-06, 6.109476089477539e-06, 2.1338462829589844e-05, 3.656744956970215e-05, 5.179643630981445e-05, 6.702542304992676e-05, 8.225440979003906e-05, 9.748339653015137e-05, 0.00011271238327026367, 0.00012794137001037598, 0.00014317035675048828, 0.00015839934349060059, 0.0001736283302307129, 0.0001888573169708252, 0.0002040863037109375, 0.0002193152904510498, 0.0002345442771911621, 0.0002497732639312744, 0.0002650022506713867, 0.000280231237411499, 0.00029546022415161133, 0.00031068921089172363, 0.00032591819763183594, 0.00034114718437194824, 0.00035637617111206055, 0.00037160515785217285, 0.00038683414459228516, 0.00040206313133239746, 0.00041729211807250977, 0.00043252110481262207, 0.0004477500915527344]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 8.0, 6.0, 19.0, 25.0, 43.0, 46.0, 84.0, 138.0, 201.0, 321.0, 517.0, 811.0, 1308.0, 2116.0, 3136.0, 5075.0, 8131.0, 13041.0, 20542.0, 32404.0, 49078.0, 71487.0, 96968.0, 120694.0, 133987.0, 128883.0, 109048.0, 82948.0, 58821.0, 39576.0, 25590.0, 16153.0, 10246.0, 6288.0, 4038.0, 2538.0, 1500.0, 987.0, 643.0, 393.0, 258.0, 146.0, 113.0, 76.0, 37.0, 23.0, 17.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-7.58203125, -7.35040283203125, -7.1187744140625, -6.88714599609375, -6.655517578125, -6.42388916015625, -6.1922607421875, -5.96063232421875, -5.72900390625, -5.49737548828125, -5.2657470703125, -5.03411865234375, -4.802490234375, -4.57086181640625, -4.3392333984375, -4.10760498046875, -3.8759765625, -3.64434814453125, -3.4127197265625, -3.18109130859375, -2.949462890625, -2.71783447265625, -2.4862060546875, -2.25457763671875, -2.02294921875, -1.79132080078125, -1.5596923828125, -1.32806396484375, -1.096435546875, -0.86480712890625, -0.6331787109375, -0.40155029296875, -0.169921875, 0.06170654296875, 0.2933349609375, 0.52496337890625, 0.756591796875, 0.98822021484375, 1.2198486328125, 1.45147705078125, 1.68310546875, 1.91473388671875, 2.1463623046875, 2.37799072265625, 2.609619140625, 2.84124755859375, 3.0728759765625, 3.30450439453125, 3.5361328125, 3.76776123046875, 3.9993896484375, 4.23101806640625, 4.462646484375, 4.69427490234375, 4.9259033203125, 5.15753173828125, 5.38916015625, 5.62078857421875, 5.8524169921875, 6.08404541015625, 6.315673828125, 6.54730224609375, 6.7789306640625, 7.01055908203125, 7.2421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 12.0, 5.0, 13.0, 10.0, 10.0, 18.0, 33.0, 21.0, 34.0, 34.0, 47.0, 40.0, 43.0, 61.0, 55.0, 52.0, 60.0, 55.0, 54.0, 44.0, 38.0, 41.0, 34.0, 45.0, 29.0, 17.0, 27.0, 11.0, 9.0, 8.0, 4.0, 8.0, 0.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.255859375, -3.15716552734375, -3.0584716796875, -2.95977783203125, -2.861083984375, -2.76239013671875, -2.6636962890625, -2.56500244140625, -2.46630859375, -2.36761474609375, -2.2689208984375, -2.17022705078125, -2.071533203125, -1.97283935546875, -1.8741455078125, -1.77545166015625, -1.6767578125, -1.57806396484375, -1.4793701171875, -1.38067626953125, -1.281982421875, -1.18328857421875, -1.0845947265625, -0.98590087890625, -0.88720703125, -0.78851318359375, -0.6898193359375, -0.59112548828125, -0.492431640625, -0.39373779296875, -0.2950439453125, -0.19635009765625, -0.09765625, 0.00103759765625, 0.0997314453125, 0.19842529296875, 0.297119140625, 0.39581298828125, 0.4945068359375, 0.59320068359375, 0.69189453125, 0.79058837890625, 0.8892822265625, 0.98797607421875, 1.086669921875, 1.18536376953125, 1.2840576171875, 1.38275146484375, 1.4814453125, 1.58013916015625, 1.6788330078125, 1.77752685546875, 1.876220703125, 1.97491455078125, 2.0736083984375, 2.17230224609375, 2.27099609375, 2.36968994140625, 2.4683837890625, 2.56707763671875, 2.665771484375, 2.76446533203125, 2.8631591796875, 2.96185302734375, 3.060546875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 9.0, 5.0, 11.0, 15.0, 20.0, 10.0, 17.0, 21.0, 23.0, 23.0, 24.0, 39.0, 40.0, 41.0, 35.0, 51.0, 67.0, 42.0, 45.0, 44.0, 54.0, 44.0, 46.0, 43.0, 33.0, 32.0, 22.0, 18.0, 21.0, 22.0, 15.0, 20.0, 12.0, 9.0, 9.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.479982376098633, -20.81294059753418, -20.145898818969727, -19.478857040405273, -18.811817169189453, -18.144775390625, -17.477733612060547, -16.810691833496094, -16.14365005493164, -15.476608276367188, -14.809566497802734, -14.142525672912598, -13.475483894348145, -12.808442115783691, -12.141401290893555, -11.474359512329102, -10.807317733764648, -10.140275955200195, -9.473234176635742, -8.806193351745605, -8.139151573181152, -7.472109794616699, -6.805068492889404, -6.138027191162109, -5.470985412597656, -4.803943634033203, -4.136902332305908, -3.469860792160034, -2.80281925201416, -2.135777711868286, -1.468736171722412, -0.8016948699951172, -0.13465309143066406, 0.53238844871521, 1.199429988861084, 1.866471529006958, 2.533513069152832, 3.200554609298706, 3.86759614944458, 4.534637451171875, 5.201679229736328, 5.868721008300781, 6.535762310028076, 7.202803611755371, 7.869845390319824, 8.536887168884277, 9.203927993774414, 9.870969772338867, 10.53801155090332, 11.205053329467773, 11.872095108032227, 12.539135932922363, 13.206177711486816, 13.87321949005127, 14.540260314941406, 15.20730209350586, 15.874343872070312, 16.541385650634766, 17.20842742919922, 17.875469207763672, 18.542510986328125, 19.209550857543945, 19.8765926361084, 20.54363441467285, 21.210676193237305]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 5.0, 4.0, 6.0, 10.0, 9.0, 4.0, 8.0, 10.0, 18.0, 17.0, 22.0, 18.0, 25.0, 30.0, 32.0, 34.0, 38.0, 43.0, 41.0, 39.0, 44.0, 40.0, 43.0, 39.0, 38.0, 38.0, 40.0, 44.0, 28.0, 45.0, 21.0, 21.0, 18.0, 20.0, 15.0, 19.0, 14.0, 15.0, 14.0, 10.0, 7.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.20357894897461, -16.610828399658203, -16.018075942993164, -15.425325393676758, -14.832573890686035, -14.239822387695312, -13.647071838378906, -13.054320335388184, -12.461568832397461, -11.868817329406738, -11.276065826416016, -10.68331527709961, -10.090563774108887, -9.497812271118164, -8.905061721801758, -8.312310218811035, -7.7195587158203125, -7.12680721282959, -6.534056186676025, -5.941305160522461, -5.348553657531738, -4.755802154541016, -4.163051128387451, -3.5703001022338867, -2.977548599243164, -2.3847973346710205, -1.792046070098877, -1.1992948055267334, -0.6065435409545898, -0.013792276382446289, 0.5789589881896973, 1.1717100143432617, 1.7644615173339844, 2.357212781906128, 2.9499640464782715, 3.542715311050415, 4.135466575622559, 4.728218078613281, 5.320969104766846, 5.91372013092041, 6.506471633911133, 7.0992231369018555, 7.69197416305542, 8.284725189208984, 8.877476692199707, 9.47022819519043, 10.062978744506836, 10.655730247497559, 11.248481750488281, 11.841233253479004, 12.433984756469727, 13.026735305786133, 13.619486808776855, 14.212238311767578, 14.804988861083984, 15.397740364074707, 15.99049186706543, 16.583242416381836, 17.175994873046875, 17.76874542236328, 18.361495971679688, 18.954248428344727, 19.546998977661133, 20.139751434326172, 20.732501983642578]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 10.0, 12.0, 19.0, 37.0, 55.0, 79.0, 114.0, 176.0, 282.0, 421.0, 670.0, 992.0, 1490.0, 2371.0, 3664.0, 5334.0, 7989.0, 11682.0, 17289.0, 24537.0, 34229.0, 45124.0, 58536.0, 72549.0, 85496.0, 94294.0, 98321.0, 95686.0, 86905.0, 74661.0, 60824.0, 47711.0, 35163.0, 25898.0, 17977.0, 12590.0, 8636.0, 5715.0, 3741.0, 2553.0, 1605.0, 1089.0, 745.0, 461.0, 292.0, 182.0, 128.0, 80.0, 49.0, 36.0, 17.0, 19.0, 11.0, 7.0, 1.0, 4.0, 1.0], "bins": [-10.984375, -10.6572265625, -10.330078125, -10.0029296875, -9.67578125, -9.3486328125, -9.021484375, -8.6943359375, -8.3671875, -8.0400390625, -7.712890625, -7.3857421875, -7.05859375, -6.7314453125, -6.404296875, -6.0771484375, -5.75, -5.4228515625, -5.095703125, -4.7685546875, -4.44140625, -4.1142578125, -3.787109375, -3.4599609375, -3.1328125, -2.8056640625, -2.478515625, -2.1513671875, -1.82421875, -1.4970703125, -1.169921875, -0.8427734375, -0.515625, -0.1884765625, 0.138671875, 0.4658203125, 0.79296875, 1.1201171875, 1.447265625, 1.7744140625, 2.1015625, 2.4287109375, 2.755859375, 3.0830078125, 3.41015625, 3.7373046875, 4.064453125, 4.3916015625, 4.71875, 5.0458984375, 5.373046875, 5.7001953125, 6.02734375, 6.3544921875, 6.681640625, 7.0087890625, 7.3359375, 7.6630859375, 7.990234375, 8.3173828125, 8.64453125, 8.9716796875, 9.298828125, 9.6259765625, 9.953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 6.0, 7.0, 4.0, 3.0, 8.0, 10.0, 8.0, 15.0, 16.0, 20.0, 24.0, 20.0, 29.0, 25.0, 31.0, 30.0, 34.0, 40.0, 50.0, 38.0, 45.0, 35.0, 47.0, 49.0, 26.0, 42.0, 44.0, 38.0, 39.0, 29.0, 22.0, 33.0, 22.0, 17.0, 13.0, 15.0, 16.0, 15.0, 10.0, 9.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75, -18.128173828125, -17.50634765625, -16.884521484375, -16.2626953125, -15.640869140625, -15.01904296875, -14.397216796875, -13.775390625, -13.153564453125, -12.53173828125, -11.909912109375, -11.2880859375, -10.666259765625, -10.04443359375, -9.422607421875, -8.80078125, -8.178955078125, -7.55712890625, -6.935302734375, -6.3134765625, -5.691650390625, -5.06982421875, -4.447998046875, -3.826171875, -3.204345703125, -2.58251953125, -1.960693359375, -1.3388671875, -0.717041015625, -0.09521484375, 0.526611328125, 1.1484375, 1.770263671875, 2.39208984375, 3.013916015625, 3.6357421875, 4.257568359375, 4.87939453125, 5.501220703125, 6.123046875, 6.744873046875, 7.36669921875, 7.988525390625, 8.6103515625, 9.232177734375, 9.85400390625, 10.475830078125, 11.09765625, 11.719482421875, 12.34130859375, 12.963134765625, 13.5849609375, 14.206787109375, 14.82861328125, 15.450439453125, 16.072265625, 16.694091796875, 17.31591796875, 17.937744140625, 18.5595703125, 19.181396484375, 19.80322265625, 20.425048828125, 21.046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 5.0, 8.0, 17.0, 17.0, 43.0, 66.0, 74.0, 141.0, 209.0, 318.0, 511.0, 754.0, 1216.0, 1834.0, 2858.0, 4329.0, 6487.0, 9818.0, 14903.0, 21790.0, 31500.0, 44212.0, 59248.0, 75600.0, 90758.0, 101903.0, 106474.0, 102277.0, 91495.0, 76564.0, 59497.0, 44600.0, 32361.0, 22398.0, 15033.0, 10144.0, 6611.0, 4302.0, 2818.0, 1823.0, 1187.0, 820.0, 563.0, 327.0, 208.0, 172.0, 87.0, 51.0, 46.0, 33.0, 19.0, 12.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0], "bins": [-12.390625, -12.0096435546875, -11.628662109375, -11.2476806640625, -10.86669921875, -10.4857177734375, -10.104736328125, -9.7237548828125, -9.3427734375, -8.9617919921875, -8.580810546875, -8.1998291015625, -7.81884765625, -7.4378662109375, -7.056884765625, -6.6759033203125, -6.294921875, -5.9139404296875, -5.532958984375, -5.1519775390625, -4.77099609375, -4.3900146484375, -4.009033203125, -3.6280517578125, -3.2470703125, -2.8660888671875, -2.485107421875, -2.1041259765625, -1.72314453125, -1.3421630859375, -0.961181640625, -0.5802001953125, -0.19921875, 0.1817626953125, 0.562744140625, 0.9437255859375, 1.32470703125, 1.7056884765625, 2.086669921875, 2.4676513671875, 2.8486328125, 3.2296142578125, 3.610595703125, 3.9915771484375, 4.37255859375, 4.7535400390625, 5.134521484375, 5.5155029296875, 5.896484375, 6.2774658203125, 6.658447265625, 7.0394287109375, 7.42041015625, 7.8013916015625, 8.182373046875, 8.5633544921875, 8.9443359375, 9.3253173828125, 9.706298828125, 10.0872802734375, 10.46826171875, 10.8492431640625, 11.230224609375, 11.6112060546875, 11.9921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 10.0, 12.0, 8.0, 9.0, 16.0, 20.0, 17.0, 17.0, 21.0, 20.0, 27.0, 28.0, 30.0, 43.0, 36.0, 44.0, 34.0, 33.0, 28.0, 35.0, 30.0, 32.0, 36.0, 44.0, 27.0, 40.0, 31.0, 39.0, 32.0, 15.0, 18.0, 20.0, 11.0, 20.0, 9.0, 14.0, 14.0, 7.0, 4.0, 7.0, 11.0, 4.0, 2.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-11.3046875, -10.97119140625, -10.6376953125, -10.30419921875, -9.970703125, -9.63720703125, -9.3037109375, -8.97021484375, -8.63671875, -8.30322265625, -7.9697265625, -7.63623046875, -7.302734375, -6.96923828125, -6.6357421875, -6.30224609375, -5.96875, -5.63525390625, -5.3017578125, -4.96826171875, -4.634765625, -4.30126953125, -3.9677734375, -3.63427734375, -3.30078125, -2.96728515625, -2.6337890625, -2.30029296875, -1.966796875, -1.63330078125, -1.2998046875, -0.96630859375, -0.6328125, -0.29931640625, 0.0341796875, 0.36767578125, 0.701171875, 1.03466796875, 1.3681640625, 1.70166015625, 2.03515625, 2.36865234375, 2.7021484375, 3.03564453125, 3.369140625, 3.70263671875, 4.0361328125, 4.36962890625, 4.703125, 5.03662109375, 5.3701171875, 5.70361328125, 6.037109375, 6.37060546875, 6.7041015625, 7.03759765625, 7.37109375, 7.70458984375, 8.0380859375, 8.37158203125, 8.705078125, 9.03857421875, 9.3720703125, 9.70556640625, 10.0390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 9.0, 4.0, 4.0, 5.0, 8.0, 11.0, 28.0, 25.0, 29.0, 39.0, 57.0, 78.0, 129.0, 145.0, 195.0, 324.0, 515.0, 890.0, 1440.0, 2358.0, 4018.0, 6918.0, 11719.0, 20481.0, 34139.0, 54149.0, 80280.0, 109212.0, 133122.0, 142113.0, 131400.0, 106879.0, 77250.0, 51634.0, 32152.0, 19270.0, 11108.0, 6631.0, 3755.0, 2212.0, 1367.0, 807.0, 522.0, 343.0, 237.0, 152.0, 106.0, 85.0, 61.0, 34.0, 30.0, 29.0, 12.0, 16.0, 14.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0], "bins": [-5.51953125, -5.34942626953125, -5.1793212890625, -5.00921630859375, -4.839111328125, -4.66900634765625, -4.4989013671875, -4.32879638671875, -4.15869140625, -3.98858642578125, -3.8184814453125, -3.64837646484375, -3.478271484375, -3.30816650390625, -3.1380615234375, -2.96795654296875, -2.7978515625, -2.62774658203125, -2.4576416015625, -2.28753662109375, -2.117431640625, -1.94732666015625, -1.7772216796875, -1.60711669921875, -1.43701171875, -1.26690673828125, -1.0968017578125, -0.92669677734375, -0.756591796875, -0.58648681640625, -0.4163818359375, -0.24627685546875, -0.076171875, 0.09393310546875, 0.2640380859375, 0.43414306640625, 0.604248046875, 0.77435302734375, 0.9444580078125, 1.11456298828125, 1.28466796875, 1.45477294921875, 1.6248779296875, 1.79498291015625, 1.965087890625, 2.13519287109375, 2.3052978515625, 2.47540283203125, 2.6455078125, 2.81561279296875, 2.9857177734375, 3.15582275390625, 3.325927734375, 3.49603271484375, 3.6661376953125, 3.83624267578125, 4.00634765625, 4.17645263671875, 4.3465576171875, 4.51666259765625, 4.686767578125, 4.85687255859375, 5.0269775390625, 5.19708251953125, 5.3671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 13.0, 6.0, 19.0, 23.0, 20.0, 28.0, 42.0, 54.0, 46.0, 62.0, 63.0, 72.0, 63.0, 66.0, 59.0, 60.0, 42.0, 48.0, 42.0, 40.0, 29.0, 22.0, 22.0, 21.0, 12.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008058547973632812, -0.0007820576429367065, -0.0007582604885101318, -0.0007344633340835571, -0.0007106661796569824, -0.0006868690252304077, -0.000663071870803833, -0.0006392747163772583, -0.0006154775619506836, -0.0005916804075241089, -0.0005678832530975342, -0.0005440860986709595, -0.0005202889442443848, -0.0004964917898178101, -0.00047269463539123535, -0.00044889748096466064, -0.00042510032653808594, -0.00040130317211151123, -0.0003775060176849365, -0.0003537088632583618, -0.0003299117088317871, -0.0003061145544052124, -0.0002823173999786377, -0.000258520245552063, -0.00023472309112548828, -0.00021092593669891357, -0.00018712878227233887, -0.00016333162784576416, -0.00013953447341918945, -0.00011573731899261475, -9.194016456604004e-05, -6.814301013946533e-05, -4.4345855712890625e-05, -2.0548701286315918e-05, 3.248453140258789e-06, 2.7045607566833496e-05, 5.08427619934082e-05, 7.463991641998291e-05, 9.843707084655762e-05, 0.00012223422527313232, 0.00014603137969970703, 0.00016982853412628174, 0.00019362568855285645, 0.00021742284297943115, 0.00024121999740600586, 0.00026501715183258057, 0.0002888143062591553, 0.00031261146068573, 0.0003364086151123047, 0.0003602057695388794, 0.0003840029239654541, 0.0004078000783920288, 0.0004315972328186035, 0.0004553943872451782, 0.00047919154167175293, 0.0005029886960983276, 0.0005267858505249023, 0.000550583004951477, 0.0005743801593780518, 0.0005981773138046265, 0.0006219744682312012, 0.0006457716226577759, 0.0006695687770843506, 0.0006933659315109253, 0.0007171630859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 7.0, 11.0, 17.0, 33.0, 50.0, 84.0, 143.0, 241.0, 449.0, 914.0, 1830.0, 4061.0, 9376.0, 21553.0, 48686.0, 96879.0, 162618.0, 210624.0, 200987.0, 141957.0, 79695.0, 38132.0, 16703.0, 7252.0, 3139.0, 1486.0, 714.0, 408.0, 195.0, 109.0, 65.0, 42.0, 23.0, 19.0, 18.0, 12.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5234375, -9.2420654296875, -8.960693359375, -8.6793212890625, -8.39794921875, -8.1165771484375, -7.835205078125, -7.5538330078125, -7.2724609375, -6.9910888671875, -6.709716796875, -6.4283447265625, -6.14697265625, -5.8656005859375, -5.584228515625, -5.3028564453125, -5.021484375, -4.7401123046875, -4.458740234375, -4.1773681640625, -3.89599609375, -3.6146240234375, -3.333251953125, -3.0518798828125, -2.7705078125, -2.4891357421875, -2.207763671875, -1.9263916015625, -1.64501953125, -1.3636474609375, -1.082275390625, -0.8009033203125, -0.51953125, -0.2381591796875, 0.043212890625, 0.3245849609375, 0.60595703125, 0.8873291015625, 1.168701171875, 1.4500732421875, 1.7314453125, 2.0128173828125, 2.294189453125, 2.5755615234375, 2.85693359375, 3.1383056640625, 3.419677734375, 3.7010498046875, 3.982421875, 4.2637939453125, 4.545166015625, 4.8265380859375, 5.10791015625, 5.3892822265625, 5.670654296875, 5.9520263671875, 6.2333984375, 6.5147705078125, 6.796142578125, 7.0775146484375, 7.35888671875, 7.6402587890625, 7.921630859375, 8.2030029296875, 8.484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 1.0, 3.0, 6.0, 13.0, 12.0, 11.0, 19.0, 20.0, 20.0, 28.0, 17.0, 29.0, 37.0, 35.0, 37.0, 38.0, 44.0, 38.0, 36.0, 49.0, 46.0, 42.0, 53.0, 42.0, 46.0, 36.0, 26.0, 19.0, 21.0, 30.0, 24.0, 15.0, 22.0, 14.0, 12.0, 13.0, 10.0, 6.0, 5.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.03515625, -1.971221923828125, -1.90728759765625, -1.843353271484375, -1.7794189453125, -1.715484619140625, -1.65155029296875, -1.587615966796875, -1.523681640625, -1.459747314453125, -1.39581298828125, -1.331878662109375, -1.2679443359375, -1.204010009765625, -1.14007568359375, -1.076141357421875, -1.01220703125, -0.948272705078125, -0.88433837890625, -0.820404052734375, -0.7564697265625, -0.692535400390625, -0.62860107421875, -0.564666748046875, -0.500732421875, -0.436798095703125, -0.37286376953125, -0.308929443359375, -0.2449951171875, -0.181060791015625, -0.11712646484375, -0.053192138671875, 0.0107421875, 0.074676513671875, 0.13861083984375, 0.202545166015625, 0.2664794921875, 0.330413818359375, 0.39434814453125, 0.458282470703125, 0.522216796875, 0.586151123046875, 0.65008544921875, 0.714019775390625, 0.7779541015625, 0.841888427734375, 0.90582275390625, 0.969757080078125, 1.03369140625, 1.097625732421875, 1.16156005859375, 1.225494384765625, 1.2894287109375, 1.353363037109375, 1.41729736328125, 1.481231689453125, 1.545166015625, 1.609100341796875, 1.67303466796875, 1.736968994140625, 1.8009033203125, 1.864837646484375, 1.92877197265625, 1.992706298828125, 2.056640625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 5.0, 4.0, 7.0, 13.0, 18.0, 16.0, 15.0, 25.0, 26.0, 21.0, 39.0, 32.0, 35.0, 55.0, 40.0, 51.0, 59.0, 51.0, 46.0, 55.0, 59.0, 43.0, 47.0, 42.0, 32.0, 24.0, 27.0, 19.0, 21.0, 18.0, 12.0, 12.0, 11.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.590105056762695, -22.868511199951172, -22.14691734313965, -21.425323486328125, -20.703731536865234, -19.98213768005371, -19.260543823242188, -18.538949966430664, -17.81735610961914, -17.095762252807617, -16.374168395996094, -15.652575492858887, -14.93098258972168, -14.209388732910156, -13.487794876098633, -12.76620101928711, -12.044609069824219, -11.323015213012695, -10.601422309875488, -9.879828453063965, -9.158235549926758, -8.436641693115234, -7.715047836303711, -6.993454456329346, -6.2718610763549805, -5.550267696380615, -4.82867431640625, -4.107080459594727, -3.3854870796203613, -2.663893699645996, -1.9422998428344727, -1.2207064628601074, -0.4991111755371094, 0.2224823236465454, 0.9440758228302002, 1.6656694412231445, 2.3872628211975098, 3.108856201171875, 3.8304500579833984, 4.552043437957764, 5.273636817932129, 5.995230197906494, 6.716823577880859, 7.438417434692383, 8.160011291503906, 8.881604194641113, 9.603198051452637, 10.324790954589844, 11.046384811401367, 11.76797866821289, 12.489571571350098, 13.211165428161621, 13.932758331298828, 14.654352188110352, 15.375946044921875, 16.0975399017334, 16.819133758544922, 17.540727615356445, 18.26232147216797, 18.98391342163086, 19.705507278442383, 20.427101135253906, 21.14869499206543, 21.870288848876953, 22.591880798339844]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 3.0, 8.0, 9.0, 13.0, 17.0, 15.0, 19.0, 22.0, 23.0, 23.0, 23.0, 32.0, 30.0, 33.0, 35.0, 36.0, 31.0, 52.0, 41.0, 40.0, 37.0, 42.0, 33.0, 27.0, 37.0, 43.0, 31.0, 31.0, 27.0, 28.0, 22.0, 26.0, 16.0, 13.0, 11.0, 10.0, 10.0, 12.0, 5.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.025646209716797, -19.424264907836914, -18.822885513305664, -18.22150421142578, -17.6201229095459, -17.018741607666016, -16.417362213134766, -15.815980911254883, -15.214600563049316, -14.61322021484375, -14.011838912963867, -13.4104585647583, -12.809078216552734, -12.207696914672852, -11.606316566467285, -11.004936218261719, -10.403554916381836, -9.80217456817627, -9.200793266296387, -8.59941291809082, -7.998032093048096, -7.396651268005371, -6.795270919799805, -6.19389009475708, -5.5925092697143555, -4.991128444671631, -4.389747619628906, -3.78836727142334, -3.1869864463806152, -2.5856056213378906, -1.9842250347137451, -1.3828444480895996, -0.7814655303955078, -0.18008482456207275, 0.4212958812713623, 1.0226765871047974, 1.6240572929382324, 2.225438117980957, 2.8268187046051025, 3.428199291229248, 4.029580116271973, 4.630960941314697, 5.232341766357422, 5.833722114562988, 6.435102939605713, 7.0364837646484375, 7.637864112854004, 8.23924446105957, 8.840625762939453, 9.44200611114502, 10.043387413024902, 10.644767761230469, 11.246149063110352, 11.847529411315918, 12.448909759521484, 13.050291061401367, 13.651671409606934, 14.2530517578125, 14.854433059692383, 15.45581340789795, 16.057193756103516, 16.6585750579834, 17.25995635986328, 17.86133575439453, 18.462717056274414]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 16.0, 17.0, 24.0, 50.0, 73.0, 96.0, 180.0, 314.0, 509.0, 802.0, 1433.0, 2259.0, 3906.0, 6950.0, 12280.0, 22274.0, 39845.0, 74017.0, 138748.0, 255226.0, 437647.0, 644232.0, 753910.0, 680457.0, 481907.0, 289734.0, 159228.0, 85117.0, 46216.0, 24997.0, 13652.0, 7635.0, 4411.0, 2524.0, 1450.0, 816.0, 491.0, 339.0, 204.0, 111.0, 69.0, 43.0, 32.0, 17.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-20.765625, -20.16552734375, -19.5654296875, -18.96533203125, -18.365234375, -17.76513671875, -17.1650390625, -16.56494140625, -15.96484375, -15.36474609375, -14.7646484375, -14.16455078125, -13.564453125, -12.96435546875, -12.3642578125, -11.76416015625, -11.1640625, -10.56396484375, -9.9638671875, -9.36376953125, -8.763671875, -8.16357421875, -7.5634765625, -6.96337890625, -6.36328125, -5.76318359375, -5.1630859375, -4.56298828125, -3.962890625, -3.36279296875, -2.7626953125, -2.16259765625, -1.5625, -0.96240234375, -0.3623046875, 0.23779296875, 0.837890625, 1.43798828125, 2.0380859375, 2.63818359375, 3.23828125, 3.83837890625, 4.4384765625, 5.03857421875, 5.638671875, 6.23876953125, 6.8388671875, 7.43896484375, 8.0390625, 8.63916015625, 9.2392578125, 9.83935546875, 10.439453125, 11.03955078125, 11.6396484375, 12.23974609375, 12.83984375, 13.43994140625, 14.0400390625, 14.64013671875, 15.240234375, 15.84033203125, 16.4404296875, 17.04052734375, 17.640625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 10.0, 18.0, 11.0, 15.0, 13.0, 16.0, 25.0, 28.0, 29.0, 22.0, 36.0, 36.0, 42.0, 41.0, 35.0, 28.0, 41.0, 36.0, 48.0, 26.0, 42.0, 42.0, 42.0, 32.0, 38.0, 27.0, 26.0, 23.0, 27.0, 27.0, 19.0, 11.0, 15.0, 10.0, 12.0, 8.0, 8.0, 1.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.20556640625, -16.6611328125, -16.11669921875, -15.572265625, -15.02783203125, -14.4833984375, -13.93896484375, -13.39453125, -12.85009765625, -12.3056640625, -11.76123046875, -11.216796875, -10.67236328125, -10.1279296875, -9.58349609375, -9.0390625, -8.49462890625, -7.9501953125, -7.40576171875, -6.861328125, -6.31689453125, -5.7724609375, -5.22802734375, -4.68359375, -4.13916015625, -3.5947265625, -3.05029296875, -2.505859375, -1.96142578125, -1.4169921875, -0.87255859375, -0.328125, 0.21630859375, 0.7607421875, 1.30517578125, 1.849609375, 2.39404296875, 2.9384765625, 3.48291015625, 4.02734375, 4.57177734375, 5.1162109375, 5.66064453125, 6.205078125, 6.74951171875, 7.2939453125, 7.83837890625, 8.3828125, 8.92724609375, 9.4716796875, 10.01611328125, 10.560546875, 11.10498046875, 11.6494140625, 12.19384765625, 12.73828125, 13.28271484375, 13.8271484375, 14.37158203125, 14.916015625, 15.46044921875, 16.0048828125, 16.54931640625, 17.09375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 12.0, 13.0, 17.0, 20.0, 31.0, 43.0, 66.0, 111.0, 225.0, 359.0, 554.0, 833.0, 1445.0, 2456.0, 4222.0, 6995.0, 12300.0, 21802.0, 38619.0, 67962.0, 121255.0, 207646.0, 340937.0, 503460.0, 641292.0, 667034.0, 562486.0, 396834.0, 251241.0, 148556.0, 84699.0, 47378.0, 26882.0, 15239.0, 8817.0, 4945.0, 3026.0, 1720.0, 1043.0, 634.0, 398.0, 240.0, 152.0, 109.0, 60.0, 38.0, 34.0, 14.0, 8.0, 9.0, 6.0, 6.0, 3.0, 3.0], "bins": [-23.3125, -22.64990234375, -21.9873046875, -21.32470703125, -20.662109375, -19.99951171875, -19.3369140625, -18.67431640625, -18.01171875, -17.34912109375, -16.6865234375, -16.02392578125, -15.361328125, -14.69873046875, -14.0361328125, -13.37353515625, -12.7109375, -12.04833984375, -11.3857421875, -10.72314453125, -10.060546875, -9.39794921875, -8.7353515625, -8.07275390625, -7.41015625, -6.74755859375, -6.0849609375, -5.42236328125, -4.759765625, -4.09716796875, -3.4345703125, -2.77197265625, -2.109375, -1.44677734375, -0.7841796875, -0.12158203125, 0.541015625, 1.20361328125, 1.8662109375, 2.52880859375, 3.19140625, 3.85400390625, 4.5166015625, 5.17919921875, 5.841796875, 6.50439453125, 7.1669921875, 7.82958984375, 8.4921875, 9.15478515625, 9.8173828125, 10.47998046875, 11.142578125, 11.80517578125, 12.4677734375, 13.13037109375, 13.79296875, 14.45556640625, 15.1181640625, 15.78076171875, 16.443359375, 17.10595703125, 17.7685546875, 18.43115234375, 19.09375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 22.0, 16.0, 24.0, 29.0, 46.0, 35.0, 53.0, 53.0, 66.0, 77.0, 103.0, 121.0, 162.0, 150.0, 174.0, 194.0, 199.0, 189.0, 210.0, 215.0, 220.0, 187.0, 190.0, 156.0, 169.0, 186.0, 137.0, 97.0, 91.0, 81.0, 91.0, 61.0, 54.0, 45.0, 26.0, 34.0, 25.0, 18.0, 20.0, 11.0, 6.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.97265625, -7.73333740234375, -7.4940185546875, -7.25469970703125, -7.015380859375, -6.77606201171875, -6.5367431640625, -6.29742431640625, -6.05810546875, -5.81878662109375, -5.5794677734375, -5.34014892578125, -5.100830078125, -4.86151123046875, -4.6221923828125, -4.38287353515625, -4.1435546875, -3.90423583984375, -3.6649169921875, -3.42559814453125, -3.186279296875, -2.94696044921875, -2.7076416015625, -2.46832275390625, -2.22900390625, -1.98968505859375, -1.7503662109375, -1.51104736328125, -1.271728515625, -1.03240966796875, -0.7930908203125, -0.55377197265625, -0.314453125, -0.07513427734375, 0.1641845703125, 0.40350341796875, 0.642822265625, 0.88214111328125, 1.1214599609375, 1.36077880859375, 1.60009765625, 1.83941650390625, 2.0787353515625, 2.31805419921875, 2.557373046875, 2.79669189453125, 3.0360107421875, 3.27532958984375, 3.5146484375, 3.75396728515625, 3.9932861328125, 4.23260498046875, 4.471923828125, 4.71124267578125, 4.9505615234375, 5.18988037109375, 5.42919921875, 5.66851806640625, 5.9078369140625, 6.14715576171875, 6.386474609375, 6.62579345703125, 6.8651123046875, 7.10443115234375, 7.34375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 3.0, 6.0, 13.0, 12.0, 24.0, 23.0, 13.0, 27.0, 24.0, 36.0, 36.0, 42.0, 43.0, 33.0, 40.0, 45.0, 37.0, 47.0, 44.0, 32.0, 47.0, 43.0, 39.0, 49.0, 37.0, 30.0, 22.0, 17.0, 21.0, 22.0, 12.0, 14.0, 10.0, 8.0, 8.0, 5.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.688480377197266, -21.00305938720703, -20.317638397216797, -19.632217407226562, -18.946796417236328, -18.261375427246094, -17.57595443725586, -16.890533447265625, -16.20511245727539, -15.519691467285156, -14.834270477294922, -14.148849487304688, -13.463428497314453, -12.778007507324219, -12.092586517333984, -11.40716552734375, -10.721744537353516, -10.036323547363281, -9.350902557373047, -8.665481567382812, -7.980060577392578, -7.294639587402344, -6.609218597412109, -5.923797607421875, -5.238376617431641, -4.552955627441406, -3.867534637451172, -3.1821136474609375, -2.496692657470703, -1.8112716674804688, -1.1258506774902344, -0.4404296875, 0.2449932098388672, 0.9304141998291016, 1.615835189819336, 2.3012561798095703, 2.9866771697998047, 3.672098159790039, 4.357519149780273, 5.042940139770508, 5.728361129760742, 6.413782119750977, 7.099203109741211, 7.784624099731445, 8.47004508972168, 9.155466079711914, 9.840887069702148, 10.526308059692383, 11.211729049682617, 11.897150039672852, 12.582571029663086, 13.26799201965332, 13.953413009643555, 14.638833999633789, 15.324254989624023, 16.009675979614258, 16.695096969604492, 17.380517959594727, 18.06593894958496, 18.751359939575195, 19.43678092956543, 20.122201919555664, 20.8076229095459, 21.493043899536133, 22.178464889526367]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 10.0, 1.0, 9.0, 11.0, 6.0, 11.0, 20.0, 18.0, 17.0, 23.0, 30.0, 31.0, 29.0, 25.0, 35.0, 20.0, 39.0, 44.0, 42.0, 42.0, 41.0, 38.0, 44.0, 37.0, 33.0, 29.0, 38.0, 28.0, 39.0, 31.0, 29.0, 20.0, 20.0, 21.0, 18.0, 8.0, 22.0, 12.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.586881637573242, -20.977073669433594, -20.367265701293945, -19.75745964050293, -19.14765167236328, -18.537843704223633, -17.928035736083984, -17.318227767944336, -16.708419799804688, -16.09861183166504, -15.488804817199707, -14.878996849060059, -14.269189834594727, -13.659381866455078, -13.04957389831543, -12.439765930175781, -11.829959869384766, -11.220151901245117, -10.610344886779785, -10.000536918640137, -9.390729904174805, -8.780921936035156, -8.171113967895508, -7.561306476593018, -6.951498985290527, -6.341691493988037, -5.731884002685547, -5.122076034545898, -4.512268543243408, -3.902461051940918, -3.2926533222198486, -2.6828455924987793, -2.0730361938476562, -1.4632285833358765, -0.8534209728240967, -0.2436133623123169, 0.3661942481994629, 0.9760017395019531, 1.5858094692230225, 2.195617198944092, 2.805424690246582, 3.4152321815490723, 4.0250396728515625, 4.634847640991211, 5.244655132293701, 5.854462623596191, 6.46427059173584, 7.07407808303833, 7.68388557434082, 8.293693542480469, 8.9035005569458, 9.51330852508545, 10.123115539550781, 10.73292350769043, 11.342731475830078, 11.952539443969727, 12.562346458435059, 13.172154426574707, 13.781961441040039, 14.391769409179688, 15.001577377319336, 15.611384391784668, 16.22119140625, 16.83099937438965, 17.440807342529297]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 11.0, 15.0, 17.0, 32.0, 42.0, 59.0, 103.0, 189.0, 287.0, 433.0, 840.0, 1281.0, 2132.0, 3450.0, 5807.0, 9425.0, 15380.0, 24199.0, 37753.0, 56445.0, 78767.0, 103510.0, 122143.0, 129642.0, 122266.0, 102189.0, 77753.0, 55303.0, 36906.0, 23439.0, 15006.0, 9273.0, 5704.0, 3398.0, 2071.0, 1292.0, 780.0, 434.0, 293.0, 186.0, 96.0, 75.0, 52.0, 27.0, 13.0, 15.0, 9.0, 9.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.0703125, -9.7503662109375, -9.430419921875, -9.1104736328125, -8.79052734375, -8.4705810546875, -8.150634765625, -7.8306884765625, -7.5107421875, -7.1907958984375, -6.870849609375, -6.5509033203125, -6.23095703125, -5.9110107421875, -5.591064453125, -5.2711181640625, -4.951171875, -4.6312255859375, -4.311279296875, -3.9913330078125, -3.67138671875, -3.3514404296875, -3.031494140625, -2.7115478515625, -2.3916015625, -2.0716552734375, -1.751708984375, -1.4317626953125, -1.11181640625, -0.7918701171875, -0.471923828125, -0.1519775390625, 0.16796875, 0.4879150390625, 0.807861328125, 1.1278076171875, 1.44775390625, 1.7677001953125, 2.087646484375, 2.4075927734375, 2.7275390625, 3.0474853515625, 3.367431640625, 3.6873779296875, 4.00732421875, 4.3272705078125, 4.647216796875, 4.9671630859375, 5.287109375, 5.6070556640625, 5.927001953125, 6.2469482421875, 6.56689453125, 6.8868408203125, 7.206787109375, 7.5267333984375, 7.8466796875, 8.1666259765625, 8.486572265625, 8.8065185546875, 9.12646484375, 9.4464111328125, 9.766357421875, 10.0863037109375, 10.40625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 13.0, 9.0, 15.0, 11.0, 15.0, 21.0, 22.0, 18.0, 29.0, 31.0, 33.0, 40.0, 36.0, 46.0, 35.0, 39.0, 31.0, 54.0, 45.0, 57.0, 29.0, 28.0, 43.0, 40.0, 27.0, 37.0, 16.0, 27.0, 22.0, 22.0, 17.0, 17.0, 20.0, 8.0, 8.0, 9.0, 0.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.779541015625, -21.10595703125, -20.432373046875, -19.7587890625, -19.085205078125, -18.41162109375, -17.738037109375, -17.064453125, -16.390869140625, -15.71728515625, -15.043701171875, -14.3701171875, -13.696533203125, -13.02294921875, -12.349365234375, -11.67578125, -11.002197265625, -10.32861328125, -9.655029296875, -8.9814453125, -8.307861328125, -7.63427734375, -6.960693359375, -6.287109375, -5.613525390625, -4.93994140625, -4.266357421875, -3.5927734375, -2.919189453125, -2.24560546875, -1.572021484375, -0.8984375, -0.224853515625, 0.44873046875, 1.122314453125, 1.7958984375, 2.469482421875, 3.14306640625, 3.816650390625, 4.490234375, 5.163818359375, 5.83740234375, 6.510986328125, 7.1845703125, 7.858154296875, 8.53173828125, 9.205322265625, 9.87890625, 10.552490234375, 11.22607421875, 11.899658203125, 12.5732421875, 13.246826171875, 13.92041015625, 14.593994140625, 15.267578125, 15.941162109375, 16.61474609375, 17.288330078125, 17.9619140625, 18.635498046875, 19.30908203125, 19.982666015625, 20.65625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 14.0, 30.0, 62.0, 63.0, 136.0, 162.0, 329.0, 558.0, 989.0, 1690.0, 3396.0, 6341.0, 12459.0, 24826.0, 48642.0, 91478.0, 152537.0, 204233.0, 196676.0, 138537.0, 79905.0, 41582.0, 21276.0, 10573.0, 5522.0, 2854.0, 1552.0, 866.0, 507.0, 299.0, 156.0, 122.0, 54.0, 47.0, 28.0, 22.0, 8.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.09375, -19.482666015625, -18.87158203125, -18.260498046875, -17.6494140625, -17.038330078125, -16.42724609375, -15.816162109375, -15.205078125, -14.593994140625, -13.98291015625, -13.371826171875, -12.7607421875, -12.149658203125, -11.53857421875, -10.927490234375, -10.31640625, -9.705322265625, -9.09423828125, -8.483154296875, -7.8720703125, -7.260986328125, -6.64990234375, -6.038818359375, -5.427734375, -4.816650390625, -4.20556640625, -3.594482421875, -2.9833984375, -2.372314453125, -1.76123046875, -1.150146484375, -0.5390625, 0.072021484375, 0.68310546875, 1.294189453125, 1.9052734375, 2.516357421875, 3.12744140625, 3.738525390625, 4.349609375, 4.960693359375, 5.57177734375, 6.182861328125, 6.7939453125, 7.405029296875, 8.01611328125, 8.627197265625, 9.23828125, 9.849365234375, 10.46044921875, 11.071533203125, 11.6826171875, 12.293701171875, 12.90478515625, 13.515869140625, 14.126953125, 14.738037109375, 15.34912109375, 15.960205078125, 16.5712890625, 17.182373046875, 17.79345703125, 18.404541015625, 19.015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 7.0, 6.0, 10.0, 19.0, 17.0, 19.0, 17.0, 23.0, 22.0, 28.0, 22.0, 32.0, 31.0, 27.0, 27.0, 31.0, 36.0, 36.0, 37.0, 38.0, 44.0, 39.0, 38.0, 34.0, 40.0, 32.0, 29.0, 29.0, 25.0, 23.0, 28.0, 24.0, 25.0, 13.0, 15.0, 12.0, 14.0, 6.0, 3.0, 4.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.828125, -11.44921875, -11.0703125, -10.69140625, -10.3125, -9.93359375, -9.5546875, -9.17578125, -8.796875, -8.41796875, -8.0390625, -7.66015625, -7.28125, -6.90234375, -6.5234375, -6.14453125, -5.765625, -5.38671875, -5.0078125, -4.62890625, -4.25, -3.87109375, -3.4921875, -3.11328125, -2.734375, -2.35546875, -1.9765625, -1.59765625, -1.21875, -0.83984375, -0.4609375, -0.08203125, 0.296875, 0.67578125, 1.0546875, 1.43359375, 1.8125, 2.19140625, 2.5703125, 2.94921875, 3.328125, 3.70703125, 4.0859375, 4.46484375, 4.84375, 5.22265625, 5.6015625, 5.98046875, 6.359375, 6.73828125, 7.1171875, 7.49609375, 7.875, 8.25390625, 8.6328125, 9.01171875, 9.390625, 9.76953125, 10.1484375, 10.52734375, 10.90625, 11.28515625, 11.6640625, 12.04296875, 12.421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 9.0, 7.0, 16.0, 17.0, 21.0, 48.0, 47.0, 68.0, 102.0, 129.0, 192.0, 292.0, 430.0, 708.0, 1079.0, 1927.0, 3060.0, 5277.0, 9241.0, 16200.0, 28533.0, 49199.0, 84148.0, 130772.0, 174071.0, 179076.0, 140652.0, 92088.0, 55373.0, 31978.0, 18212.0, 10494.0, 5984.0, 3488.0, 2079.0, 1245.0, 769.0, 485.0, 335.0, 214.0, 150.0, 105.0, 65.0, 59.0, 28.0, 23.0, 19.0, 13.0, 7.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.75390625, -6.5367431640625, -6.319580078125, -6.1024169921875, -5.88525390625, -5.6680908203125, -5.450927734375, -5.2337646484375, -5.0166015625, -4.7994384765625, -4.582275390625, -4.3651123046875, -4.14794921875, -3.9307861328125, -3.713623046875, -3.4964599609375, -3.279296875, -3.0621337890625, -2.844970703125, -2.6278076171875, -2.41064453125, -2.1934814453125, -1.976318359375, -1.7591552734375, -1.5419921875, -1.3248291015625, -1.107666015625, -0.8905029296875, -0.67333984375, -0.4561767578125, -0.239013671875, -0.0218505859375, 0.1953125, 0.4124755859375, 0.629638671875, 0.8468017578125, 1.06396484375, 1.2811279296875, 1.498291015625, 1.7154541015625, 1.9326171875, 2.1497802734375, 2.366943359375, 2.5841064453125, 2.80126953125, 3.0184326171875, 3.235595703125, 3.4527587890625, 3.669921875, 3.8870849609375, 4.104248046875, 4.3214111328125, 4.53857421875, 4.7557373046875, 4.972900390625, 5.1900634765625, 5.4072265625, 5.6243896484375, 5.841552734375, 6.0587158203125, 6.27587890625, 6.4930419921875, 6.710205078125, 6.9273681640625, 7.14453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 10.0, 3.0, 11.0, 18.0, 18.0, 29.0, 25.0, 35.0, 38.0, 45.0, 45.0, 53.0, 49.0, 49.0, 44.0, 65.0, 50.0, 56.0, 58.0, 47.0, 37.0, 40.0, 27.0, 27.0, 28.0, 21.0, 17.0, 12.0, 8.0, 9.0, 8.0, 0.0, 2.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004208087921142578, -0.0004077740013599396, -0.00039473921060562134, -0.0003817044198513031, -0.00036866962909698486, -0.0003556348383426666, -0.0003426000475883484, -0.00032956525683403015, -0.0003165304660797119, -0.0003034956753253937, -0.00029046088457107544, -0.0002774260938167572, -0.00026439130306243896, -0.00025135651230812073, -0.0002383217215538025, -0.00022528693079948425, -0.00021225214004516602, -0.00019921734929084778, -0.00018618255853652954, -0.0001731477677822113, -0.00016011297702789307, -0.00014707818627357483, -0.0001340433955192566, -0.00012100860476493835, -0.00010797381401062012, -9.493902325630188e-05, -8.190423250198364e-05, -6.88694417476654e-05, -5.583465099334717e-05, -4.279986023902893e-05, -2.9765069484710693e-05, -1.6730278730392456e-05, -3.6954879760742188e-06, 9.339302778244019e-06, 2.2374093532562256e-05, 3.540888428688049e-05, 4.844367504119873e-05, 6.147846579551697e-05, 7.45132565498352e-05, 8.754804730415344e-05, 0.00010058283805847168, 0.00011361762881278992, 0.00012665241956710815, 0.0001396872103214264, 0.00015272200107574463, 0.00016575679183006287, 0.0001787915825843811, 0.00019182637333869934, 0.00020486116409301758, 0.00021789595484733582, 0.00023093074560165405, 0.0002439655363559723, 0.00025700032711029053, 0.00027003511786460876, 0.000283069908618927, 0.00029610469937324524, 0.0003091394901275635, 0.0003221742808818817, 0.00033520907163619995, 0.0003482438623905182, 0.0003612786531448364, 0.00037431344389915466, 0.0003873482346534729, 0.00040038302540779114, 0.0004134178161621094]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 8.0, 13.0, 21.0, 26.0, 42.0, 64.0, 64.0, 100.0, 154.0, 224.0, 353.0, 586.0, 1007.0, 1733.0, 3073.0, 5429.0, 9823.0, 18024.0, 32560.0, 56556.0, 93091.0, 136079.0, 168510.0, 167969.0, 134410.0, 91669.0, 55616.0, 31531.0, 17348.0, 9627.0, 5407.0, 3018.0, 1676.0, 1029.0, 602.0, 365.0, 255.0, 139.0, 98.0, 73.0, 49.0, 44.0, 28.0, 16.0, 16.0, 14.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.3828125, -9.106689453125, -8.83056640625, -8.554443359375, -8.2783203125, -8.002197265625, -7.72607421875, -7.449951171875, -7.173828125, -6.897705078125, -6.62158203125, -6.345458984375, -6.0693359375, -5.793212890625, -5.51708984375, -5.240966796875, -4.96484375, -4.688720703125, -4.41259765625, -4.136474609375, -3.8603515625, -3.584228515625, -3.30810546875, -3.031982421875, -2.755859375, -2.479736328125, -2.20361328125, -1.927490234375, -1.6513671875, -1.375244140625, -1.09912109375, -0.822998046875, -0.546875, -0.270751953125, 0.00537109375, 0.281494140625, 0.5576171875, 0.833740234375, 1.10986328125, 1.385986328125, 1.662109375, 1.938232421875, 2.21435546875, 2.490478515625, 2.7666015625, 3.042724609375, 3.31884765625, 3.594970703125, 3.87109375, 4.147216796875, 4.42333984375, 4.699462890625, 4.9755859375, 5.251708984375, 5.52783203125, 5.803955078125, 6.080078125, 6.356201171875, 6.63232421875, 6.908447265625, 7.1845703125, 7.460693359375, 7.73681640625, 8.012939453125, 8.2890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 11.0, 9.0, 14.0, 14.0, 12.0, 26.0, 23.0, 28.0, 32.0, 27.0, 27.0, 50.0, 53.0, 52.0, 67.0, 69.0, 52.0, 78.0, 49.0, 51.0, 36.0, 40.0, 33.0, 27.0, 13.0, 14.0, 16.0, 11.0, 16.0, 8.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.671875, -3.570220947265625, -3.46856689453125, -3.366912841796875, -3.2652587890625, -3.163604736328125, -3.06195068359375, -2.960296630859375, -2.858642578125, -2.756988525390625, -2.65533447265625, -2.553680419921875, -2.4520263671875, -2.350372314453125, -2.24871826171875, -2.147064208984375, -2.04541015625, -1.943756103515625, -1.84210205078125, -1.740447998046875, -1.6387939453125, -1.537139892578125, -1.43548583984375, -1.333831787109375, -1.232177734375, -1.130523681640625, -1.02886962890625, -0.927215576171875, -0.8255615234375, -0.723907470703125, -0.62225341796875, -0.520599365234375, -0.4189453125, -0.317291259765625, -0.21563720703125, -0.113983154296875, -0.0123291015625, 0.089324951171875, 0.19097900390625, 0.292633056640625, 0.394287109375, 0.495941162109375, 0.59759521484375, 0.699249267578125, 0.8009033203125, 0.902557373046875, 1.00421142578125, 1.105865478515625, 1.20751953125, 1.309173583984375, 1.41082763671875, 1.512481689453125, 1.6141357421875, 1.715789794921875, 1.81744384765625, 1.919097900390625, 2.020751953125, 2.122406005859375, 2.22406005859375, 2.325714111328125, 2.4273681640625, 2.529022216796875, 2.63067626953125, 2.732330322265625, 2.833984375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 7.0, 2.0, 10.0, 19.0, 17.0, 18.0, 20.0, 35.0, 34.0, 23.0, 28.0, 46.0, 43.0, 37.0, 44.0, 35.0, 44.0, 42.0, 39.0, 43.0, 48.0, 43.0, 36.0, 37.0, 41.0, 27.0, 24.0, 26.0, 21.0, 13.0, 19.0, 10.0, 10.0, 9.0, 9.0, 5.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-21.88576316833496, -21.210844039916992, -20.535926818847656, -19.861007690429688, -19.18609046936035, -18.511171340942383, -17.836254119873047, -17.161334991455078, -16.48641586303711, -15.811497688293457, -15.136579513549805, -14.461660385131836, -13.7867431640625, -13.111824035644531, -12.436905860900879, -11.761987686157227, -11.08707046508789, -10.412152290344238, -9.737234115600586, -9.062314987182617, -8.387397766113281, -7.712479114532471, -7.03756046295166, -6.362642288208008, -5.6877241134643555, -5.012805938720703, -4.337887763977051, -3.6629691123962402, -2.988050937652588, -2.3131327629089355, -1.638214111328125, -0.9632959365844727, -0.2883777618408203, 0.3865405321121216, 1.0614588260650635, 1.736377239227295, 2.4112954139709473, 3.0862135887145996, 3.76113224029541, 4.4360504150390625, 5.110968589782715, 5.785886764526367, 6.4608049392700195, 7.13572359085083, 7.810641765594482, 8.485559463500977, 9.160478591918945, 9.835396766662598, 10.51031494140625, 11.185233116149902, 11.860151290893555, 12.535070419311523, 13.20998764038086, 13.884906768798828, 14.55982494354248, 15.234743118286133, 15.909661293029785, 16.584579467773438, 17.259498596191406, 17.934415817260742, 18.60933494567871, 19.284252166748047, 19.959171295166016, 20.634090423583984, 21.30900764465332]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 7.0, 4.0, 11.0, 11.0, 8.0, 19.0, 14.0, 15.0, 21.0, 27.0, 26.0, 21.0, 33.0, 31.0, 21.0, 34.0, 43.0, 41.0, 49.0, 41.0, 35.0, 42.0, 42.0, 31.0, 41.0, 31.0, 33.0, 40.0, 32.0, 29.0, 20.0, 18.0, 22.0, 23.0, 16.0, 14.0, 12.0, 15.0, 4.0, 2.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.122201919555664, -20.521953582763672, -19.92170524597168, -19.321456909179688, -18.721210479736328, -18.120962142944336, -17.520713806152344, -16.92046546936035, -16.32021713256836, -15.719968795776367, -15.119721412658691, -14.5194730758667, -13.919224739074707, -13.318977355957031, -12.718729019165039, -12.118480682373047, -11.518233299255371, -10.917984962463379, -10.317737579345703, -9.717489242553711, -9.117240905761719, -8.516992568969727, -7.916745185852051, -7.316496849060059, -6.716248989105225, -6.116001129150391, -5.515752792358398, -4.9155049324035645, -4.3152570724487305, -3.7150087356567383, -3.1147608757019043, -2.514512538909912, -1.9142646789550781, -1.314016580581665, -0.7137686014175415, -0.11352062225341797, 0.4867274761199951, 1.0869755744934082, 1.6872234344482422, 2.2874717712402344, 2.8877196311950684, 3.4879677295684814, 4.0882158279418945, 4.6884636878967285, 5.2887115478515625, 5.888959884643555, 6.489207744598389, 7.089456081390381, 7.689703941345215, 8.289952278137207, 8.890199661254883, 9.490447998046875, 10.090696334838867, 10.69094467163086, 11.291192054748535, 11.891440391540527, 12.491687774658203, 13.091936111450195, 13.692183494567871, 14.292431831359863, 14.892680168151855, 15.492927551269531, 16.093175888061523, 16.693424224853516, 17.293672561645508]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 11.0, 21.0, 29.0, 25.0, 58.0, 75.0, 163.0, 214.0, 379.0, 491.0, 826.0, 1330.0, 2145.0, 3132.0, 5358.0, 8335.0, 12538.0, 19612.0, 28761.0, 41414.0, 57207.0, 74622.0, 91105.0, 103862.0, 109405.0, 106779.0, 96323.0, 80235.0, 62089.0, 46279.0, 32464.0, 22269.0, 14863.0, 9374.0, 6197.0, 3832.0, 2424.0, 1553.0, 968.0, 634.0, 432.0, 247.0, 146.0, 118.0, 81.0, 41.0, 31.0, 28.0, 15.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.9140625, -11.537841796875, -11.16162109375, -10.785400390625, -10.4091796875, -10.032958984375, -9.65673828125, -9.280517578125, -8.904296875, -8.528076171875, -8.15185546875, -7.775634765625, -7.3994140625, -7.023193359375, -6.64697265625, -6.270751953125, -5.89453125, -5.518310546875, -5.14208984375, -4.765869140625, -4.3896484375, -4.013427734375, -3.63720703125, -3.260986328125, -2.884765625, -2.508544921875, -2.13232421875, -1.756103515625, -1.3798828125, -1.003662109375, -0.62744140625, -0.251220703125, 0.125, 0.501220703125, 0.87744140625, 1.253662109375, 1.6298828125, 2.006103515625, 2.38232421875, 2.758544921875, 3.134765625, 3.510986328125, 3.88720703125, 4.263427734375, 4.6396484375, 5.015869140625, 5.39208984375, 5.768310546875, 6.14453125, 6.520751953125, 6.89697265625, 7.273193359375, 7.6494140625, 8.025634765625, 8.40185546875, 8.778076171875, 9.154296875, 9.530517578125, 9.90673828125, 10.282958984375, 10.6591796875, 11.035400390625, 11.41162109375, 11.787841796875, 12.1640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 4.0, 9.0, 7.0, 12.0, 20.0, 20.0, 20.0, 21.0, 28.0, 27.0, 20.0, 34.0, 16.0, 31.0, 28.0, 36.0, 40.0, 45.0, 48.0, 36.0, 43.0, 33.0, 46.0, 34.0, 32.0, 43.0, 30.0, 30.0, 28.0, 27.0, 22.0, 15.0, 18.0, 20.0, 17.0, 9.0, 7.0, 5.0, 10.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-21.6875, -21.07275390625, -20.4580078125, -19.84326171875, -19.228515625, -18.61376953125, -17.9990234375, -17.38427734375, -16.76953125, -16.15478515625, -15.5400390625, -14.92529296875, -14.310546875, -13.69580078125, -13.0810546875, -12.46630859375, -11.8515625, -11.23681640625, -10.6220703125, -10.00732421875, -9.392578125, -8.77783203125, -8.1630859375, -7.54833984375, -6.93359375, -6.31884765625, -5.7041015625, -5.08935546875, -4.474609375, -3.85986328125, -3.2451171875, -2.63037109375, -2.015625, -1.40087890625, -0.7861328125, -0.17138671875, 0.443359375, 1.05810546875, 1.6728515625, 2.28759765625, 2.90234375, 3.51708984375, 4.1318359375, 4.74658203125, 5.361328125, 5.97607421875, 6.5908203125, 7.20556640625, 7.8203125, 8.43505859375, 9.0498046875, 9.66455078125, 10.279296875, 10.89404296875, 11.5087890625, 12.12353515625, 12.73828125, 13.35302734375, 13.9677734375, 14.58251953125, 15.197265625, 15.81201171875, 16.4267578125, 17.04150390625, 17.65625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 12.0, 16.0, 28.0, 38.0, 63.0, 86.0, 150.0, 240.0, 368.0, 584.0, 926.0, 1378.0, 2022.0, 3180.0, 4875.0, 7592.0, 11614.0, 17454.0, 25653.0, 36966.0, 51042.0, 67242.0, 83563.0, 97712.0, 105939.0, 106969.0, 99330.0, 84981.0, 68460.0, 52067.0, 38047.0, 26941.0, 18287.0, 12085.0, 7871.0, 5245.0, 3416.0, 2208.0, 1429.0, 881.0, 560.0, 369.0, 258.0, 155.0, 108.0, 63.0, 30.0, 23.0, 14.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.796875, -12.3975830078125, -11.998291015625, -11.5989990234375, -11.19970703125, -10.8004150390625, -10.401123046875, -10.0018310546875, -9.6025390625, -9.2032470703125, -8.803955078125, -8.4046630859375, -8.00537109375, -7.6060791015625, -7.206787109375, -6.8074951171875, -6.408203125, -6.0089111328125, -5.609619140625, -5.2103271484375, -4.81103515625, -4.4117431640625, -4.012451171875, -3.6131591796875, -3.2138671875, -2.8145751953125, -2.415283203125, -2.0159912109375, -1.61669921875, -1.2174072265625, -0.818115234375, -0.4188232421875, -0.01953125, 0.3797607421875, 0.779052734375, 1.1783447265625, 1.57763671875, 1.9769287109375, 2.376220703125, 2.7755126953125, 3.1748046875, 3.5740966796875, 3.973388671875, 4.3726806640625, 4.77197265625, 5.1712646484375, 5.570556640625, 5.9698486328125, 6.369140625, 6.7684326171875, 7.167724609375, 7.5670166015625, 7.96630859375, 8.3656005859375, 8.764892578125, 9.1641845703125, 9.5634765625, 9.9627685546875, 10.362060546875, 10.7613525390625, 11.16064453125, 11.5599365234375, 11.959228515625, 12.3585205078125, 12.7578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 7.0, 10.0, 14.0, 14.0, 12.0, 27.0, 19.0, 26.0, 11.0, 22.0, 23.0, 15.0, 33.0, 35.0, 48.0, 32.0, 34.0, 31.0, 45.0, 36.0, 45.0, 46.0, 30.0, 38.0, 31.0, 44.0, 20.0, 38.0, 25.0, 28.0, 22.0, 16.0, 24.0, 17.0, 9.0, 12.0, 9.0, 8.0, 5.0, 6.0, 5.0, 4.0, 5.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.2421875, -11.8603515625, -11.478515625, -11.0966796875, -10.71484375, -10.3330078125, -9.951171875, -9.5693359375, -9.1875, -8.8056640625, -8.423828125, -8.0419921875, -7.66015625, -7.2783203125, -6.896484375, -6.5146484375, -6.1328125, -5.7509765625, -5.369140625, -4.9873046875, -4.60546875, -4.2236328125, -3.841796875, -3.4599609375, -3.078125, -2.6962890625, -2.314453125, -1.9326171875, -1.55078125, -1.1689453125, -0.787109375, -0.4052734375, -0.0234375, 0.3583984375, 0.740234375, 1.1220703125, 1.50390625, 1.8857421875, 2.267578125, 2.6494140625, 3.03125, 3.4130859375, 3.794921875, 4.1767578125, 4.55859375, 4.9404296875, 5.322265625, 5.7041015625, 6.0859375, 6.4677734375, 6.849609375, 7.2314453125, 7.61328125, 7.9951171875, 8.376953125, 8.7587890625, 9.140625, 9.5224609375, 9.904296875, 10.2861328125, 10.66796875, 11.0498046875, 11.431640625, 11.8134765625, 12.1953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 4.0, 12.0, 15.0, 18.0, 31.0, 48.0, 60.0, 105.0, 156.0, 273.0, 455.0, 727.0, 1197.0, 1954.0, 3421.0, 5565.0, 9178.0, 14777.0, 23457.0, 35998.0, 53429.0, 74801.0, 96580.0, 115589.0, 123643.0, 119849.0, 104981.0, 83598.0, 61885.0, 42746.0, 27858.0, 17945.0, 11140.0, 6711.0, 4072.0, 2326.0, 1487.0, 923.0, 586.0, 358.0, 215.0, 133.0, 75.0, 52.0, 42.0, 21.0, 20.0, 13.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0], "bins": [-5.26171875, -5.1055908203125, -4.949462890625, -4.7933349609375, -4.63720703125, -4.4810791015625, -4.324951171875, -4.1688232421875, -4.0126953125, -3.8565673828125, -3.700439453125, -3.5443115234375, -3.38818359375, -3.2320556640625, -3.075927734375, -2.9197998046875, -2.763671875, -2.6075439453125, -2.451416015625, -2.2952880859375, -2.13916015625, -1.9830322265625, -1.826904296875, -1.6707763671875, -1.5146484375, -1.3585205078125, -1.202392578125, -1.0462646484375, -0.89013671875, -0.7340087890625, -0.577880859375, -0.4217529296875, -0.265625, -0.1094970703125, 0.046630859375, 0.2027587890625, 0.35888671875, 0.5150146484375, 0.671142578125, 0.8272705078125, 0.9833984375, 1.1395263671875, 1.295654296875, 1.4517822265625, 1.60791015625, 1.7640380859375, 1.920166015625, 2.0762939453125, 2.232421875, 2.3885498046875, 2.544677734375, 2.7008056640625, 2.85693359375, 3.0130615234375, 3.169189453125, 3.3253173828125, 3.4814453125, 3.6375732421875, 3.793701171875, 3.9498291015625, 4.10595703125, 4.2620849609375, 4.418212890625, 4.5743408203125, 4.73046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 13.0, 12.0, 14.0, 20.0, 20.0, 26.0, 35.0, 47.0, 39.0, 47.0, 58.0, 55.0, 54.0, 76.0, 64.0, 59.0, 44.0, 54.0, 41.0, 45.0, 38.0, 35.0, 26.0, 19.0, 7.0, 11.0, 9.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 4.0], "bins": [-0.0009446144104003906, -0.0009220317006111145, -0.0008994489908218384, -0.0008768662810325623, -0.0008542835712432861, -0.00083170086145401, -0.0008091181516647339, -0.0007865354418754578, -0.0007639527320861816, -0.0007413700222969055, -0.0007187873125076294, -0.0006962046027183533, -0.0006736218929290771, -0.000651039183139801, -0.0006284564733505249, -0.0006058737635612488, -0.0005832910537719727, -0.0005607083439826965, -0.0005381256341934204, -0.0005155429244041443, -0.0004929602146148682, -0.00047037750482559204, -0.0004477947950363159, -0.0004252120852470398, -0.00040262937545776367, -0.00038004666566848755, -0.0003574639558792114, -0.0003348812460899353, -0.0003122985363006592, -0.00028971582651138306, -0.00026713311672210693, -0.0002445504069328308, -0.0002219676971435547, -0.00019938498735427856, -0.00017680227756500244, -0.00015421956777572632, -0.0001316368579864502, -0.00010905414819717407, -8.647143840789795e-05, -6.388872861862183e-05, -4.13060188293457e-05, -1.872330904006958e-05, 3.859400749206543e-06, 2.6442110538482666e-05, 4.902482032775879e-05, 7.160753011703491e-05, 9.419023990631104e-05, 0.00011677294969558716, 0.00013935565948486328, 0.0001619383692741394, 0.00018452107906341553, 0.00020710378885269165, 0.00022968649864196777, 0.0002522692084312439, 0.00027485191822052, 0.00029743462800979614, 0.00032001733779907227, 0.0003426000475883484, 0.0003651827573776245, 0.00038776546716690063, 0.00041034817695617676, 0.0004329308867454529, 0.000455513596534729, 0.0004780963063240051, 0.0005006790161132812]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 7.0, 4.0, 5.0, 15.0, 23.0, 36.0, 49.0, 89.0, 132.0, 212.0, 355.0, 538.0, 893.0, 1385.0, 2345.0, 3903.0, 6233.0, 9958.0, 15447.0, 24215.0, 36396.0, 52171.0, 71662.0, 91304.0, 107826.0, 116725.0, 114352.0, 103639.0, 85936.0, 65325.0, 47221.0, 32350.0, 21490.0, 13735.0, 8676.0, 5395.0, 3272.0, 2009.0, 1211.0, 755.0, 495.0, 276.0, 184.0, 119.0, 71.0, 49.0, 28.0, 26.0, 10.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.03515625, -4.8770751953125, -4.718994140625, -4.5609130859375, -4.40283203125, -4.2447509765625, -4.086669921875, -3.9285888671875, -3.7705078125, -3.6124267578125, -3.454345703125, -3.2962646484375, -3.13818359375, -2.9801025390625, -2.822021484375, -2.6639404296875, -2.505859375, -2.3477783203125, -2.189697265625, -2.0316162109375, -1.87353515625, -1.7154541015625, -1.557373046875, -1.3992919921875, -1.2412109375, -1.0831298828125, -0.925048828125, -0.7669677734375, -0.60888671875, -0.4508056640625, -0.292724609375, -0.1346435546875, 0.0234375, 0.1815185546875, 0.339599609375, 0.4976806640625, 0.65576171875, 0.8138427734375, 0.971923828125, 1.1300048828125, 1.2880859375, 1.4461669921875, 1.604248046875, 1.7623291015625, 1.92041015625, 2.0784912109375, 2.236572265625, 2.3946533203125, 2.552734375, 2.7108154296875, 2.868896484375, 3.0269775390625, 3.18505859375, 3.3431396484375, 3.501220703125, 3.6593017578125, 3.8173828125, 3.9754638671875, 4.133544921875, 4.2916259765625, 4.44970703125, 4.6077880859375, 4.765869140625, 4.9239501953125, 5.08203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 8.0, 15.0, 11.0, 9.0, 17.0, 17.0, 17.0, 28.0, 27.0, 33.0, 33.0, 39.0, 33.0, 57.0, 50.0, 36.0, 37.0, 38.0, 49.0, 60.0, 47.0, 45.0, 39.0, 36.0, 39.0, 23.0, 25.0, 19.0, 24.0, 20.0, 15.0, 11.0, 11.0, 9.0, 1.0, 5.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.028167724609375, -1.96063232421875, -1.893096923828125, -1.8255615234375, -1.758026123046875, -1.69049072265625, -1.622955322265625, -1.555419921875, -1.487884521484375, -1.42034912109375, -1.352813720703125, -1.2852783203125, -1.217742919921875, -1.15020751953125, -1.082672119140625, -1.01513671875, -0.947601318359375, -0.88006591796875, -0.812530517578125, -0.7449951171875, -0.677459716796875, -0.60992431640625, -0.542388916015625, -0.474853515625, -0.407318115234375, -0.33978271484375, -0.272247314453125, -0.2047119140625, -0.137176513671875, -0.06964111328125, -0.002105712890625, 0.0654296875, 0.132965087890625, 0.20050048828125, 0.268035888671875, 0.3355712890625, 0.403106689453125, 0.47064208984375, 0.538177490234375, 0.605712890625, 0.673248291015625, 0.74078369140625, 0.808319091796875, 0.8758544921875, 0.943389892578125, 1.01092529296875, 1.078460693359375, 1.14599609375, 1.213531494140625, 1.28106689453125, 1.348602294921875, 1.4161376953125, 1.483673095703125, 1.55120849609375, 1.618743896484375, 1.686279296875, 1.753814697265625, 1.82135009765625, 1.888885498046875, 1.9564208984375, 2.023956298828125, 2.09149169921875, 2.159027099609375, 2.2265625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 9.0, 7.0, 14.0, 15.0, 20.0, 18.0, 27.0, 31.0, 30.0, 26.0, 24.0, 37.0, 53.0, 36.0, 36.0, 34.0, 39.0, 52.0, 40.0, 40.0, 56.0, 43.0, 40.0, 36.0, 21.0, 30.0, 24.0, 25.0, 21.0, 19.0, 16.0, 11.0, 12.0, 6.0, 6.0, 6.0, 4.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.727628707885742, -20.070180892944336, -19.41273307800293, -18.755285263061523, -18.09783935546875, -17.440391540527344, -16.782943725585938, -16.12549591064453, -15.468048095703125, -14.810600280761719, -14.153152465820312, -13.495705604553223, -12.838257789611816, -12.18080997467041, -11.52336311340332, -10.865915298461914, -10.208467483520508, -9.551019668579102, -8.893571853637695, -8.236124992370605, -7.578677177429199, -6.921229362487793, -6.263782024383545, -5.606334686279297, -4.948886871337891, -4.291439056396484, -3.6339917182922363, -2.976544141769409, -2.319096565246582, -1.6616489887237549, -1.0042014122009277, -0.3467540740966797, 0.3106956481933594, 0.9681432247161865, 1.6255908012390137, 2.283038377761841, 2.940485954284668, 3.597933530807495, 4.255381107330322, 4.91282844543457, 5.570276260375977, 6.227724075317383, 6.885171413421631, 7.542618751525879, 8.200066566467285, 8.857514381408691, 9.514961242675781, 10.172409057617188, 10.829856872558594, 11.4873046875, 12.144752502441406, 12.802199363708496, 13.459647178649902, 14.117094993591309, 14.774541854858398, 15.431989669799805, 16.08943748474121, 16.746885299682617, 17.404333114624023, 18.06178092956543, 18.719226837158203, 19.37667465209961, 20.034122467041016, 20.691570281982422, 21.349018096923828]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 6.0, 6.0, 12.0, 11.0, 14.0, 15.0, 15.0, 26.0, 27.0, 19.0, 30.0, 34.0, 32.0, 39.0, 33.0, 34.0, 29.0, 40.0, 34.0, 33.0, 28.0, 30.0, 50.0, 40.0, 37.0, 33.0, 33.0, 36.0, 27.0, 18.0, 21.0, 22.0, 12.0, 15.0, 12.0, 19.0, 10.0, 17.0, 9.0, 8.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.596355438232422, -20.969160079956055, -20.341964721679688, -19.714767456054688, -19.08757209777832, -18.460376739501953, -17.833179473876953, -17.205984115600586, -16.57878875732422, -15.951593399047852, -15.324397087097168, -14.697200775146484, -14.070005416870117, -13.44281005859375, -12.815613746643066, -12.188417434692383, -11.561222076416016, -10.934026718139648, -10.306830406188965, -9.679634094238281, -9.052438735961914, -8.425243377685547, -7.798047065734863, -7.170851230621338, -6.5436553955078125, -5.916459560394287, -5.289263725280762, -4.662067890167236, -4.034872055053711, -3.4076762199401855, -2.78048038482666, -2.1532845497131348, -1.5260868072509766, -0.8988909721374512, -0.2716951370239258, 0.3555006980895996, 0.982696533203125, 1.6098923683166504, 2.237088203430176, 2.864284038543701, 3.4914798736572266, 4.118675708770752, 4.745871543884277, 5.373067378997803, 6.000263214111328, 6.6274590492248535, 7.254654884338379, 7.881850719451904, 8.50904655456543, 9.136241912841797, 9.76343822479248, 10.390634536743164, 11.017829895019531, 11.645025253295898, 12.272221565246582, 12.899417877197266, 13.526613235473633, 14.15380859375, 14.781004905700684, 15.408201217651367, 16.035396575927734, 16.6625919342041, 17.28978729248047, 17.91698455810547, 18.544179916381836]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 17.0, 16.0, 41.0, 45.0, 74.0, 144.0, 175.0, 302.0, 447.0, 737.0, 1130.0, 1705.0, 2674.0, 4270.0, 6748.0, 10890.0, 17787.0, 29001.0, 47579.0, 79475.0, 131882.0, 215017.0, 335535.0, 479274.0, 592116.0, 616369.0, 535782.0, 400085.0, 265338.0, 165332.0, 99960.0, 60027.0, 36303.0, 22064.0, 13511.0, 8430.0, 5130.0, 3284.0, 1967.0, 1249.0, 800.0, 539.0, 357.0, 237.0, 155.0, 101.0, 62.0, 46.0, 17.0, 10.0, 14.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0], "bins": [-16.890625, -16.366455078125, -15.84228515625, -15.318115234375, -14.7939453125, -14.269775390625, -13.74560546875, -13.221435546875, -12.697265625, -12.173095703125, -11.64892578125, -11.124755859375, -10.6005859375, -10.076416015625, -9.55224609375, -9.028076171875, -8.50390625, -7.979736328125, -7.45556640625, -6.931396484375, -6.4072265625, -5.883056640625, -5.35888671875, -4.834716796875, -4.310546875, -3.786376953125, -3.26220703125, -2.738037109375, -2.2138671875, -1.689697265625, -1.16552734375, -0.641357421875, -0.1171875, 0.406982421875, 0.93115234375, 1.455322265625, 1.9794921875, 2.503662109375, 3.02783203125, 3.552001953125, 4.076171875, 4.600341796875, 5.12451171875, 5.648681640625, 6.1728515625, 6.697021484375, 7.22119140625, 7.745361328125, 8.26953125, 8.793701171875, 9.31787109375, 9.842041015625, 10.3662109375, 10.890380859375, 11.41455078125, 11.938720703125, 12.462890625, 12.987060546875, 13.51123046875, 14.035400390625, 14.5595703125, 15.083740234375, 15.60791015625, 16.132080078125, 16.65625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 5.0, 6.0, 12.0, 15.0, 11.0, 11.0, 17.0, 22.0, 19.0, 26.0, 32.0, 27.0, 27.0, 32.0, 35.0, 26.0, 38.0, 41.0, 38.0, 43.0, 40.0, 37.0, 36.0, 37.0, 43.0, 30.0, 37.0, 25.0, 26.0, 23.0, 16.0, 28.0, 25.0, 10.0, 13.0, 12.0, 16.0, 11.0, 14.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.109375, -19.531494140625, -18.95361328125, -18.375732421875, -17.7978515625, -17.219970703125, -16.64208984375, -16.064208984375, -15.486328125, -14.908447265625, -14.33056640625, -13.752685546875, -13.1748046875, -12.596923828125, -12.01904296875, -11.441162109375, -10.86328125, -10.285400390625, -9.70751953125, -9.129638671875, -8.5517578125, -7.973876953125, -7.39599609375, -6.818115234375, -6.240234375, -5.662353515625, -5.08447265625, -4.506591796875, -3.9287109375, -3.350830078125, -2.77294921875, -2.195068359375, -1.6171875, -1.039306640625, -0.46142578125, 0.116455078125, 0.6943359375, 1.272216796875, 1.85009765625, 2.427978515625, 3.005859375, 3.583740234375, 4.16162109375, 4.739501953125, 5.3173828125, 5.895263671875, 6.47314453125, 7.051025390625, 7.62890625, 8.206787109375, 8.78466796875, 9.362548828125, 9.9404296875, 10.518310546875, 11.09619140625, 11.674072265625, 12.251953125, 12.829833984375, 13.40771484375, 13.985595703125, 14.5634765625, 15.141357421875, 15.71923828125, 16.297119140625, 16.875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 8.0, 16.0, 18.0, 40.0, 52.0, 88.0, 123.0, 216.0, 350.0, 499.0, 744.0, 1226.0, 1973.0, 3094.0, 4941.0, 7989.0, 12677.0, 20922.0, 34789.0, 56383.0, 92603.0, 148635.0, 232955.0, 345432.0, 469421.0, 564385.0, 576920.0, 506943.0, 387521.0, 268122.0, 173769.0, 109144.0, 66776.0, 40837.0, 24626.0, 15097.0, 9155.0, 5844.0, 3677.0, 2271.0, 1493.0, 944.0, 597.0, 356.0, 215.0, 156.0, 91.0, 53.0, 39.0, 26.0, 12.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-19.4375, -18.833251953125, -18.22900390625, -17.624755859375, -17.0205078125, -16.416259765625, -15.81201171875, -15.207763671875, -14.603515625, -13.999267578125, -13.39501953125, -12.790771484375, -12.1865234375, -11.582275390625, -10.97802734375, -10.373779296875, -9.76953125, -9.165283203125, -8.56103515625, -7.956787109375, -7.3525390625, -6.748291015625, -6.14404296875, -5.539794921875, -4.935546875, -4.331298828125, -3.72705078125, -3.122802734375, -2.5185546875, -1.914306640625, -1.31005859375, -0.705810546875, -0.1015625, 0.502685546875, 1.10693359375, 1.711181640625, 2.3154296875, 2.919677734375, 3.52392578125, 4.128173828125, 4.732421875, 5.336669921875, 5.94091796875, 6.545166015625, 7.1494140625, 7.753662109375, 8.35791015625, 8.962158203125, 9.56640625, 10.170654296875, 10.77490234375, 11.379150390625, 11.9833984375, 12.587646484375, 13.19189453125, 13.796142578125, 14.400390625, 15.004638671875, 15.60888671875, 16.213134765625, 16.8173828125, 17.421630859375, 18.02587890625, 18.630126953125, 19.234375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 15.0, 9.0, 16.0, 21.0, 31.0, 33.0, 32.0, 45.0, 74.0, 85.0, 96.0, 121.0, 127.0, 148.0, 181.0, 181.0, 209.0, 215.0, 220.0, 225.0, 257.0, 197.0, 238.0, 212.0, 195.0, 162.0, 132.0, 100.0, 107.0, 75.0, 75.0, 51.0, 38.0, 30.0, 21.0, 24.0, 16.0, 8.0, 13.0, 7.0, 10.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.859375, -8.577880859375, -8.29638671875, -8.014892578125, -7.7333984375, -7.451904296875, -7.17041015625, -6.888916015625, -6.607421875, -6.325927734375, -6.04443359375, -5.762939453125, -5.4814453125, -5.199951171875, -4.91845703125, -4.636962890625, -4.35546875, -4.073974609375, -3.79248046875, -3.510986328125, -3.2294921875, -2.947998046875, -2.66650390625, -2.385009765625, -2.103515625, -1.822021484375, -1.54052734375, -1.259033203125, -0.9775390625, -0.696044921875, -0.41455078125, -0.133056640625, 0.1484375, 0.429931640625, 0.71142578125, 0.992919921875, 1.2744140625, 1.555908203125, 1.83740234375, 2.118896484375, 2.400390625, 2.681884765625, 2.96337890625, 3.244873046875, 3.5263671875, 3.807861328125, 4.08935546875, 4.370849609375, 4.65234375, 4.933837890625, 5.21533203125, 5.496826171875, 5.7783203125, 6.059814453125, 6.34130859375, 6.622802734375, 6.904296875, 7.185791015625, 7.46728515625, 7.748779296875, 8.0302734375, 8.311767578125, 8.59326171875, 8.874755859375, 9.15625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 4.0, 9.0, 11.0, 11.0, 5.0, 12.0, 19.0, 21.0, 24.0, 20.0, 24.0, 24.0, 29.0, 33.0, 20.0, 44.0, 51.0, 42.0, 46.0, 40.0, 45.0, 35.0, 41.0, 34.0, 39.0, 33.0, 26.0, 24.0, 33.0, 23.0, 25.0, 25.0, 19.0, 12.0, 16.0, 14.0, 9.0, 10.0, 10.0, 3.0, 7.0, 7.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.27958106994629, -18.638505935668945, -17.9974308013916, -17.35635757446289, -16.715282440185547, -16.074207305908203, -15.43313217163086, -14.792057037353516, -14.150982856750488, -13.509907722473145, -12.868833541870117, -12.227758407592773, -11.58668327331543, -10.945609092712402, -10.304533958435059, -9.663459777832031, -9.022384643554688, -8.381309509277344, -7.740235328674316, -7.099160194396973, -6.458085536956787, -5.817010879516602, -5.175935745239258, -4.534861087799072, -3.8937864303588867, -3.252711772918701, -2.6116368770599365, -1.9705621004104614, -1.3294873237609863, -0.6884126663208008, -0.04733777046203613, 0.5937371253967285, 1.2348098754882812, 1.8758846521377563, 2.5169594287872314, 3.158034324645996, 3.7991089820861816, 4.440183639526367, 5.081258773803711, 5.7223334312438965, 6.363408088684082, 7.004482746124268, 7.645557403564453, 8.286632537841797, 8.92770767211914, 9.568781852722168, 10.209856986999512, 10.850931167602539, 11.492006301879883, 12.133081436157227, 12.774155616760254, 13.415230751037598, 14.056304931640625, 14.697380065917969, 15.338455200195312, 15.979530334472656, 16.62060546875, 17.261680603027344, 17.902755737304688, 18.5438289642334, 19.184904098510742, 19.825979232788086, 20.46705436706543, 21.108129501342773, 21.749202728271484]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 4.0, 6.0, 9.0, 11.0, 8.0, 19.0, 11.0, 11.0, 16.0, 16.0, 25.0, 21.0, 17.0, 22.0, 21.0, 37.0, 29.0, 22.0, 31.0, 27.0, 33.0, 32.0, 40.0, 39.0, 41.0, 41.0, 35.0, 42.0, 34.0, 24.0, 31.0, 32.0, 19.0, 13.0, 21.0, 20.0, 10.0, 21.0, 11.0, 9.0, 20.0, 13.0, 12.0, 5.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0], "bins": [-19.8543701171875, -19.280012130737305, -18.70565414428711, -18.131298065185547, -17.55694007873535, -16.982582092285156, -16.40822410583496, -15.833866119384766, -15.259509086608887, -14.685151100158691, -14.110794067382812, -13.536436080932617, -12.962078094482422, -12.387721061706543, -11.813363075256348, -11.239006042480469, -10.664648056030273, -10.090290069580078, -9.5159330368042, -8.941575050354004, -8.367218017578125, -7.79286003112793, -7.218502044677734, -6.644144535064697, -6.06978702545166, -5.495429515838623, -4.921072006225586, -4.346714019775391, -3.7723565101623535, -3.1979990005493164, -2.6236412525177, -2.049283504486084, -1.4749279022216797, -0.900570273399353, -0.32621264457702637, 0.2481449842453003, 0.822502613067627, 1.396860122680664, 1.9712178707122803, 2.5455756187438965, 3.1199331283569336, 3.6942906379699707, 4.268648147583008, 4.843006134033203, 5.41736364364624, 5.991721153259277, 6.566079139709473, 7.14043664932251, 7.714794158935547, 8.289152145385742, 8.863509178161621, 9.437867164611816, 10.012224197387695, 10.58658218383789, 11.160940170288086, 11.735298156738281, 12.30965518951416, 12.884013175964355, 13.458370208740234, 14.03272819519043, 14.607086181640625, 15.181443214416504, 15.7558012008667, 16.330158233642578, 16.904516220092773]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 21.0, 29.0, 48.0, 71.0, 113.0, 205.0, 322.0, 433.0, 762.0, 1167.0, 1809.0, 2929.0, 4560.0, 7132.0, 11027.0, 17291.0, 25917.0, 38524.0, 55133.0, 75573.0, 95747.0, 112182.0, 119437.0, 114857.0, 100399.0, 80031.0, 59581.0, 41883.0, 28666.0, 19050.0, 12155.0, 7922.0, 5033.0, 3176.0, 1943.0, 1242.0, 761.0, 485.0, 321.0, 193.0, 135.0, 102.0, 66.0, 43.0, 27.0, 15.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.9296875, -9.63427734375, -9.3388671875, -9.04345703125, -8.748046875, -8.45263671875, -8.1572265625, -7.86181640625, -7.56640625, -7.27099609375, -6.9755859375, -6.68017578125, -6.384765625, -6.08935546875, -5.7939453125, -5.49853515625, -5.203125, -4.90771484375, -4.6123046875, -4.31689453125, -4.021484375, -3.72607421875, -3.4306640625, -3.13525390625, -2.83984375, -2.54443359375, -2.2490234375, -1.95361328125, -1.658203125, -1.36279296875, -1.0673828125, -0.77197265625, -0.4765625, -0.18115234375, 0.1142578125, 0.40966796875, 0.705078125, 1.00048828125, 1.2958984375, 1.59130859375, 1.88671875, 2.18212890625, 2.4775390625, 2.77294921875, 3.068359375, 3.36376953125, 3.6591796875, 3.95458984375, 4.25, 4.54541015625, 4.8408203125, 5.13623046875, 5.431640625, 5.72705078125, 6.0224609375, 6.31787109375, 6.61328125, 6.90869140625, 7.2041015625, 7.49951171875, 7.794921875, 8.09033203125, 8.3857421875, 8.68115234375, 8.9765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 7.0, 10.0, 12.0, 12.0, 13.0, 17.0, 17.0, 21.0, 21.0, 17.0, 17.0, 31.0, 37.0, 37.0, 22.0, 32.0, 38.0, 33.0, 34.0, 48.0, 33.0, 37.0, 40.0, 33.0, 40.0, 37.0, 20.0, 30.0, 19.0, 25.0, 25.0, 18.0, 18.0, 20.0, 16.0, 14.0, 9.0, 9.0, 14.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-21.09375, -20.477783203125, -19.86181640625, -19.245849609375, -18.6298828125, -18.013916015625, -17.39794921875, -16.781982421875, -16.166015625, -15.550048828125, -14.93408203125, -14.318115234375, -13.7021484375, -13.086181640625, -12.47021484375, -11.854248046875, -11.23828125, -10.622314453125, -10.00634765625, -9.390380859375, -8.7744140625, -8.158447265625, -7.54248046875, -6.926513671875, -6.310546875, -5.694580078125, -5.07861328125, -4.462646484375, -3.8466796875, -3.230712890625, -2.61474609375, -1.998779296875, -1.3828125, -0.766845703125, -0.15087890625, 0.465087890625, 1.0810546875, 1.697021484375, 2.31298828125, 2.928955078125, 3.544921875, 4.160888671875, 4.77685546875, 5.392822265625, 6.0087890625, 6.624755859375, 7.24072265625, 7.856689453125, 8.47265625, 9.088623046875, 9.70458984375, 10.320556640625, 10.9365234375, 11.552490234375, 12.16845703125, 12.784423828125, 13.400390625, 14.016357421875, 14.63232421875, 15.248291015625, 15.8642578125, 16.480224609375, 17.09619140625, 17.712158203125, 18.328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 12.0, 16.0, 25.0, 34.0, 63.0, 89.0, 148.0, 216.0, 319.0, 518.0, 815.0, 1227.0, 2065.0, 3450.0, 5522.0, 9096.0, 15294.0, 25120.0, 42439.0, 68167.0, 103790.0, 141304.0, 162339.0, 150405.0, 115429.0, 77399.0, 48721.0, 29390.0, 17724.0, 10750.0, 6469.0, 3924.0, 2387.0, 1401.0, 951.0, 610.0, 354.0, 214.0, 113.0, 78.0, 64.0, 40.0, 20.0, 21.0, 12.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.6015625, -15.12353515625, -14.6455078125, -14.16748046875, -13.689453125, -13.21142578125, -12.7333984375, -12.25537109375, -11.77734375, -11.29931640625, -10.8212890625, -10.34326171875, -9.865234375, -9.38720703125, -8.9091796875, -8.43115234375, -7.953125, -7.47509765625, -6.9970703125, -6.51904296875, -6.041015625, -5.56298828125, -5.0849609375, -4.60693359375, -4.12890625, -3.65087890625, -3.1728515625, -2.69482421875, -2.216796875, -1.73876953125, -1.2607421875, -0.78271484375, -0.3046875, 0.17333984375, 0.6513671875, 1.12939453125, 1.607421875, 2.08544921875, 2.5634765625, 3.04150390625, 3.51953125, 3.99755859375, 4.4755859375, 4.95361328125, 5.431640625, 5.90966796875, 6.3876953125, 6.86572265625, 7.34375, 7.82177734375, 8.2998046875, 8.77783203125, 9.255859375, 9.73388671875, 10.2119140625, 10.68994140625, 11.16796875, 11.64599609375, 12.1240234375, 12.60205078125, 13.080078125, 13.55810546875, 14.0361328125, 14.51416015625, 14.9921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 7.0, 8.0, 8.0, 15.0, 13.0, 15.0, 20.0, 15.0, 25.0, 20.0, 35.0, 33.0, 38.0, 29.0, 28.0, 36.0, 41.0, 42.0, 39.0, 44.0, 53.0, 44.0, 36.0, 31.0, 44.0, 32.0, 37.0, 33.0, 23.0, 28.0, 20.0, 18.0, 18.0, 9.0, 15.0, 9.0, 9.0, 11.0, 9.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.9527587890625, -11.507080078125, -11.0614013671875, -10.61572265625, -10.1700439453125, -9.724365234375, -9.2786865234375, -8.8330078125, -8.3873291015625, -7.941650390625, -7.4959716796875, -7.05029296875, -6.6046142578125, -6.158935546875, -5.7132568359375, -5.267578125, -4.8218994140625, -4.376220703125, -3.9305419921875, -3.48486328125, -3.0391845703125, -2.593505859375, -2.1478271484375, -1.7021484375, -1.2564697265625, -0.810791015625, -0.3651123046875, 0.08056640625, 0.5262451171875, 0.971923828125, 1.4176025390625, 1.86328125, 2.3089599609375, 2.754638671875, 3.2003173828125, 3.64599609375, 4.0916748046875, 4.537353515625, 4.9830322265625, 5.4287109375, 5.8743896484375, 6.320068359375, 6.7657470703125, 7.21142578125, 7.6571044921875, 8.102783203125, 8.5484619140625, 8.994140625, 9.4398193359375, 9.885498046875, 10.3311767578125, 10.77685546875, 11.2225341796875, 11.668212890625, 12.1138916015625, 12.5595703125, 13.0052490234375, 13.450927734375, 13.8966064453125, 14.34228515625, 14.7879638671875, 15.233642578125, 15.6793212890625, 16.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 9.0, 18.0, 24.0, 22.0, 42.0, 40.0, 71.0, 103.0, 160.0, 246.0, 379.0, 637.0, 1096.0, 1930.0, 3486.0, 6456.0, 12233.0, 23451.0, 44520.0, 82758.0, 139284.0, 194460.0, 198845.0, 147069.0, 88808.0, 48543.0, 25034.0, 13071.0, 7013.0, 3698.0, 2018.0, 1204.0, 642.0, 402.0, 258.0, 169.0, 96.0, 90.0, 36.0, 22.0, 20.0, 28.0, 12.0, 9.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.98046875, -7.72357177734375, -7.4666748046875, -7.20977783203125, -6.952880859375, -6.69598388671875, -6.4390869140625, -6.18218994140625, -5.92529296875, -5.66839599609375, -5.4114990234375, -5.15460205078125, -4.897705078125, -4.64080810546875, -4.3839111328125, -4.12701416015625, -3.8701171875, -3.61322021484375, -3.3563232421875, -3.09942626953125, -2.842529296875, -2.58563232421875, -2.3287353515625, -2.07183837890625, -1.81494140625, -1.55804443359375, -1.3011474609375, -1.04425048828125, -0.787353515625, -0.53045654296875, -0.2735595703125, -0.01666259765625, 0.240234375, 0.49713134765625, 0.7540283203125, 1.01092529296875, 1.267822265625, 1.52471923828125, 1.7816162109375, 2.03851318359375, 2.29541015625, 2.55230712890625, 2.8092041015625, 3.06610107421875, 3.322998046875, 3.57989501953125, 3.8367919921875, 4.09368896484375, 4.3505859375, 4.60748291015625, 4.8643798828125, 5.12127685546875, 5.378173828125, 5.63507080078125, 5.8919677734375, 6.14886474609375, 6.40576171875, 6.66265869140625, 6.9195556640625, 7.17645263671875, 7.433349609375, 7.69024658203125, 7.9471435546875, 8.20404052734375, 8.4609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 7.0, 7.0, 2.0, 12.0, 9.0, 17.0, 22.0, 26.0, 26.0, 35.0, 49.0, 44.0, 43.0, 57.0, 56.0, 62.0, 62.0, 55.0, 51.0, 51.0, 52.0, 38.0, 35.0, 24.0, 37.0, 16.0, 15.0, 27.0, 13.0, 7.0, 9.0, 9.0, 4.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.00049591064453125, -0.0004831776022911072, -0.00047044456005096436, -0.00045771151781082153, -0.0004449784755706787, -0.0004322454333305359, -0.00041951239109039307, -0.00040677934885025024, -0.0003940463066101074, -0.0003813132643699646, -0.0003685802221298218, -0.00035584717988967896, -0.00034311413764953613, -0.0003303810954093933, -0.0003176480531692505, -0.00030491501092910767, -0.00029218196868896484, -0.000279448926448822, -0.0002667158842086792, -0.0002539828419685364, -0.00024124979972839355, -0.00022851675748825073, -0.0002157837152481079, -0.0002030506730079651, -0.00019031763076782227, -0.00017758458852767944, -0.00016485154628753662, -0.0001521185040473938, -0.00013938546180725098, -0.00012665241956710815, -0.00011391937732696533, -0.00010118633508682251, -8.845329284667969e-05, -7.572025060653687e-05, -6.298720836639404e-05, -5.025416612625122e-05, -3.75211238861084e-05, -2.4788081645965576e-05, -1.2055039405822754e-05, 6.780028343200684e-07, 1.341104507446289e-05, 2.6144087314605713e-05, 3.8877129554748535e-05, 5.161017179489136e-05, 6.434321403503418e-05, 7.7076256275177e-05, 8.980929851531982e-05, 0.00010254234075546265, 0.00011527538299560547, 0.0001280084252357483, 0.0001407414674758911, 0.00015347450971603394, 0.00016620755195617676, 0.00017894059419631958, 0.0001916736364364624, 0.00020440667867660522, 0.00021713972091674805, 0.00022987276315689087, 0.0002426058053970337, 0.0002553388476371765, 0.00026807188987731934, 0.00028080493211746216, 0.000293537974357605, 0.0003062710165977478, 0.0003190040588378906]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 10.0, 5.0, 11.0, 13.0, 26.0, 28.0, 45.0, 64.0, 87.0, 137.0, 163.0, 247.0, 358.0, 598.0, 813.0, 1308.0, 2035.0, 3419.0, 5545.0, 9307.0, 15840.0, 26860.0, 44827.0, 71412.0, 105177.0, 137797.0, 154016.0, 144651.0, 114348.0, 80418.0, 51410.0, 31214.0, 18420.0, 10998.0, 6430.0, 3858.0, 2279.0, 1477.0, 912.0, 603.0, 401.0, 313.0, 221.0, 125.0, 101.0, 70.0, 48.0, 37.0, 28.0, 17.0, 14.0, 12.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.359375, -8.103271484375, -7.84716796875, -7.591064453125, -7.3349609375, -7.078857421875, -6.82275390625, -6.566650390625, -6.310546875, -6.054443359375, -5.79833984375, -5.542236328125, -5.2861328125, -5.030029296875, -4.77392578125, -4.517822265625, -4.26171875, -4.005615234375, -3.74951171875, -3.493408203125, -3.2373046875, -2.981201171875, -2.72509765625, -2.468994140625, -2.212890625, -1.956787109375, -1.70068359375, -1.444580078125, -1.1884765625, -0.932373046875, -0.67626953125, -0.420166015625, -0.1640625, 0.092041015625, 0.34814453125, 0.604248046875, 0.8603515625, 1.116455078125, 1.37255859375, 1.628662109375, 1.884765625, 2.140869140625, 2.39697265625, 2.653076171875, 2.9091796875, 3.165283203125, 3.42138671875, 3.677490234375, 3.93359375, 4.189697265625, 4.44580078125, 4.701904296875, 4.9580078125, 5.214111328125, 5.47021484375, 5.726318359375, 5.982421875, 6.238525390625, 6.49462890625, 6.750732421875, 7.0068359375, 7.262939453125, 7.51904296875, 7.775146484375, 8.03125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 1.0, 6.0, 3.0, 5.0, 16.0, 8.0, 8.0, 16.0, 13.0, 19.0, 27.0, 26.0, 27.0, 39.0, 36.0, 57.0, 59.0, 44.0, 57.0, 51.0, 40.0, 49.0, 58.0, 45.0, 42.0, 41.0, 37.0, 34.0, 28.0, 17.0, 17.0, 10.0, 12.0, 13.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.623443603515625, -2.53204345703125, -2.440643310546875, -2.3492431640625, -2.257843017578125, -2.16644287109375, -2.075042724609375, -1.983642578125, -1.892242431640625, -1.80084228515625, -1.709442138671875, -1.6180419921875, -1.526641845703125, -1.43524169921875, -1.343841552734375, -1.25244140625, -1.161041259765625, -1.06964111328125, -0.978240966796875, -0.8868408203125, -0.795440673828125, -0.70404052734375, -0.612640380859375, -0.521240234375, -0.429840087890625, -0.33843994140625, -0.247039794921875, -0.1556396484375, -0.064239501953125, 0.02716064453125, 0.118560791015625, 0.2099609375, 0.301361083984375, 0.39276123046875, 0.484161376953125, 0.5755615234375, 0.666961669921875, 0.75836181640625, 0.849761962890625, 0.941162109375, 1.032562255859375, 1.12396240234375, 1.215362548828125, 1.3067626953125, 1.398162841796875, 1.48956298828125, 1.580963134765625, 1.67236328125, 1.763763427734375, 1.85516357421875, 1.946563720703125, 2.0379638671875, 2.129364013671875, 2.22076416015625, 2.312164306640625, 2.403564453125, 2.494964599609375, 2.58636474609375, 2.677764892578125, 2.7691650390625, 2.860565185546875, 2.95196533203125, 3.043365478515625, 3.134765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 2.0, 5.0, 1.0, 4.0, 7.0, 8.0, 9.0, 15.0, 13.0, 12.0, 17.0, 27.0, 24.0, 15.0, 27.0, 23.0, 38.0, 38.0, 34.0, 37.0, 39.0, 38.0, 47.0, 45.0, 46.0, 47.0, 35.0, 35.0, 28.0, 31.0, 23.0, 31.0, 21.0, 27.0, 19.0, 19.0, 17.0, 9.0, 17.0, 10.0, 10.0, 7.0, 12.0, 2.0, 8.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.51545524597168, -18.891408920288086, -18.267362594604492, -17.643314361572266, -17.019268035888672, -16.395221710205078, -15.771175384521484, -15.14712905883789, -14.52308177947998, -13.899035453796387, -13.274988174438477, -12.650941848754883, -12.026895523071289, -11.402848243713379, -10.778801918029785, -10.154754638671875, -9.530708312988281, -8.906661987304688, -8.282614707946777, -7.658568382263184, -7.034521579742432, -6.41047477722168, -5.786428451538086, -5.162381649017334, -4.538334846496582, -3.91428804397583, -3.2902414798736572, -2.6661949157714844, -2.0421481132507324, -1.4181013107299805, -0.7940547466278076, -0.17000818252563477, 0.45404052734375, 1.0780872106552124, 1.7021338939666748, 2.3261804580688477, 2.9502272605895996, 3.5742740631103516, 4.198320388793945, 4.822367191314697, 5.446413993835449, 6.070460796356201, 6.694507598876953, 7.318553924560547, 7.942600727081299, 8.56664752960205, 9.190693855285645, 9.814741134643555, 10.438787460327148, 11.062833786010742, 11.686881065368652, 12.310927391052246, 12.934974670410156, 13.55902099609375, 14.183067321777344, 14.807113647460938, 15.431160926818848, 16.055208206176758, 16.67925453186035, 17.303300857543945, 17.92734718322754, 18.551395416259766, 19.17544174194336, 19.799488067626953, 20.423534393310547]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 5.0, 9.0, 13.0, 7.0, 13.0, 14.0, 12.0, 17.0, 13.0, 16.0, 25.0, 27.0, 20.0, 23.0, 26.0, 40.0, 31.0, 20.0, 33.0, 33.0, 35.0, 42.0, 39.0, 30.0, 43.0, 32.0, 45.0, 26.0, 39.0, 26.0, 27.0, 25.0, 20.0, 17.0, 13.0, 15.0, 20.0, 13.0, 12.0, 16.0, 12.0, 9.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-20.018753051757812, -19.439897537231445, -18.86104393005371, -18.282188415527344, -17.703332901000977, -17.124479293823242, -16.545623779296875, -15.966769218444824, -15.387914657592773, -14.809060096740723, -14.230204582214355, -13.651350021362305, -13.072495460510254, -12.493640899658203, -11.914785385131836, -11.335930824279785, -10.757075309753418, -10.178220748901367, -9.599365234375, -9.02051067352295, -8.441656112670898, -7.8628010749816895, -7.2839460372924805, -6.70509147644043, -6.126236438751221, -5.547381401062012, -4.968526840209961, -4.389671802520752, -3.810817003250122, -3.231962203979492, -2.653107166290283, -2.0742526054382324, -1.4953975677490234, -0.9165427088737488, -0.3376878499984741, 0.2411670684814453, 0.8200218677520752, 1.398876667022705, 1.977731704711914, 2.556586265563965, 3.135441303253174, 3.7142961025238037, 4.293150901794434, 4.872005939483643, 5.450860977172852, 6.029715538024902, 6.608570575714111, 7.187425136566162, 7.766280174255371, 8.345134735107422, 8.923990249633789, 9.50284481048584, 10.08169937133789, 10.660554885864258, 11.239409446716309, 11.81826400756836, 12.397119522094727, 12.975974082946777, 13.554829597473145, 14.133684158325195, 14.712538719177246, 15.291393280029297, 15.870248794555664, 16.44910430908203, 17.027957916259766]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 11.0, 14.0, 26.0, 46.0, 49.0, 108.0, 181.0, 307.0, 489.0, 850.0, 1372.0, 2363.0, 3842.0, 6286.0, 9956.0, 15668.0, 24462.0, 36565.0, 53368.0, 72962.0, 93622.0, 110575.0, 119520.0, 116930.0, 103155.0, 83288.0, 63385.0, 45237.0, 30547.0, 20001.0, 12554.0, 8068.0, 5033.0, 3056.0, 1879.0, 1105.0, 705.0, 390.0, 230.0, 150.0, 91.0, 52.0, 23.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.4920654296875, -13.038818359375, -12.5855712890625, -12.13232421875, -11.6790771484375, -11.225830078125, -10.7725830078125, -10.3193359375, -9.8660888671875, -9.412841796875, -8.9595947265625, -8.50634765625, -8.0531005859375, -7.599853515625, -7.1466064453125, -6.693359375, -6.2401123046875, -5.786865234375, -5.3336181640625, -4.88037109375, -4.4271240234375, -3.973876953125, -3.5206298828125, -3.0673828125, -2.6141357421875, -2.160888671875, -1.7076416015625, -1.25439453125, -0.8011474609375, -0.347900390625, 0.1053466796875, 0.55859375, 1.0118408203125, 1.465087890625, 1.9183349609375, 2.37158203125, 2.8248291015625, 3.278076171875, 3.7313232421875, 4.1845703125, 4.6378173828125, 5.091064453125, 5.5443115234375, 5.99755859375, 6.4508056640625, 6.904052734375, 7.3572998046875, 7.810546875, 8.2637939453125, 8.717041015625, 9.1702880859375, 9.62353515625, 10.0767822265625, 10.530029296875, 10.9832763671875, 11.4365234375, 11.8897705078125, 12.343017578125, 12.7962646484375, 13.24951171875, 13.7027587890625, 14.156005859375, 14.6092529296875, 15.0625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 8.0, 4.0, 3.0, 10.0, 11.0, 20.0, 11.0, 15.0, 19.0, 18.0, 27.0, 23.0, 27.0, 25.0, 32.0, 30.0, 37.0, 38.0, 31.0, 36.0, 54.0, 49.0, 39.0, 43.0, 33.0, 44.0, 34.0, 44.0, 17.0, 24.0, 18.0, 21.0, 14.0, 27.0, 14.0, 18.0, 12.0, 16.0, 11.0, 3.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.671875, -21.025634765625, -20.37939453125, -19.733154296875, -19.0869140625, -18.440673828125, -17.79443359375, -17.148193359375, -16.501953125, -15.855712890625, -15.20947265625, -14.563232421875, -13.9169921875, -13.270751953125, -12.62451171875, -11.978271484375, -11.33203125, -10.685791015625, -10.03955078125, -9.393310546875, -8.7470703125, -8.100830078125, -7.45458984375, -6.808349609375, -6.162109375, -5.515869140625, -4.86962890625, -4.223388671875, -3.5771484375, -2.930908203125, -2.28466796875, -1.638427734375, -0.9921875, -0.345947265625, 0.30029296875, 0.946533203125, 1.5927734375, 2.239013671875, 2.88525390625, 3.531494140625, 4.177734375, 4.823974609375, 5.47021484375, 6.116455078125, 6.7626953125, 7.408935546875, 8.05517578125, 8.701416015625, 9.34765625, 9.993896484375, 10.64013671875, 11.286376953125, 11.9326171875, 12.578857421875, 13.22509765625, 13.871337890625, 14.517578125, 15.163818359375, 15.81005859375, 16.456298828125, 17.1025390625, 17.748779296875, 18.39501953125, 19.041259765625, 19.6875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 10.0, 4.0, 11.0, 15.0, 30.0, 55.0, 78.0, 125.0, 193.0, 323.0, 562.0, 822.0, 1475.0, 2215.0, 3533.0, 5694.0, 9035.0, 13956.0, 21543.0, 31749.0, 45492.0, 62618.0, 80861.0, 97713.0, 109519.0, 112944.0, 106514.0, 92483.0, 74089.0, 56215.0, 40206.0, 27434.0, 18253.0, 12032.0, 7807.0, 4989.0, 3121.0, 1848.0, 1156.0, 724.0, 420.0, 280.0, 172.0, 91.0, 59.0, 37.0, 23.0, 16.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.6640625, -15.1939697265625, -14.723876953125, -14.2537841796875, -13.78369140625, -13.3135986328125, -12.843505859375, -12.3734130859375, -11.9033203125, -11.4332275390625, -10.963134765625, -10.4930419921875, -10.02294921875, -9.5528564453125, -9.082763671875, -8.6126708984375, -8.142578125, -7.6724853515625, -7.202392578125, -6.7322998046875, -6.26220703125, -5.7921142578125, -5.322021484375, -4.8519287109375, -4.3818359375, -3.9117431640625, -3.441650390625, -2.9715576171875, -2.50146484375, -2.0313720703125, -1.561279296875, -1.0911865234375, -0.62109375, -0.1510009765625, 0.319091796875, 0.7891845703125, 1.25927734375, 1.7293701171875, 2.199462890625, 2.6695556640625, 3.1396484375, 3.6097412109375, 4.079833984375, 4.5499267578125, 5.02001953125, 5.4901123046875, 5.960205078125, 6.4302978515625, 6.900390625, 7.3704833984375, 7.840576171875, 8.3106689453125, 8.78076171875, 9.2508544921875, 9.720947265625, 10.1910400390625, 10.6611328125, 11.1312255859375, 11.601318359375, 12.0714111328125, 12.54150390625, 13.0115966796875, 13.481689453125, 13.9517822265625, 14.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 9.0, 13.0, 15.0, 9.0, 18.0, 16.0, 22.0, 20.0, 28.0, 22.0, 24.0, 32.0, 36.0, 33.0, 38.0, 31.0, 46.0, 39.0, 43.0, 33.0, 44.0, 48.0, 41.0, 35.0, 38.0, 34.0, 19.0, 23.0, 23.0, 26.0, 23.0, 10.0, 14.0, 12.0, 19.0, 7.0, 11.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9921875, -12.5660400390625, -12.139892578125, -11.7137451171875, -11.28759765625, -10.8614501953125, -10.435302734375, -10.0091552734375, -9.5830078125, -9.1568603515625, -8.730712890625, -8.3045654296875, -7.87841796875, -7.4522705078125, -7.026123046875, -6.5999755859375, -6.173828125, -5.7476806640625, -5.321533203125, -4.8953857421875, -4.46923828125, -4.0430908203125, -3.616943359375, -3.1907958984375, -2.7646484375, -2.3385009765625, -1.912353515625, -1.4862060546875, -1.06005859375, -0.6339111328125, -0.207763671875, 0.2183837890625, 0.64453125, 1.0706787109375, 1.496826171875, 1.9229736328125, 2.34912109375, 2.7752685546875, 3.201416015625, 3.6275634765625, 4.0537109375, 4.4798583984375, 4.906005859375, 5.3321533203125, 5.75830078125, 6.1844482421875, 6.610595703125, 7.0367431640625, 7.462890625, 7.8890380859375, 8.315185546875, 8.7413330078125, 9.16748046875, 9.5936279296875, 10.019775390625, 10.4459228515625, 10.8720703125, 11.2982177734375, 11.724365234375, 12.1505126953125, 12.57666015625, 13.0028076171875, 13.428955078125, 13.8551025390625, 14.28125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 8.0, 15.0, 29.0, 64.0, 77.0, 150.0, 243.0, 375.0, 680.0, 1018.0, 1830.0, 2989.0, 4889.0, 8126.0, 12700.0, 19978.0, 30676.0, 44841.0, 62925.0, 83437.0, 102933.0, 116243.0, 118591.0, 110149.0, 93623.0, 73800.0, 54065.0, 37189.0, 24929.0, 15888.0, 10081.0, 6198.0, 3946.0, 2329.0, 1396.0, 850.0, 484.0, 311.0, 208.0, 106.0, 60.0, 58.0, 27.0, 15.0, 13.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.8870849609375, -4.707763671875, -4.5284423828125, -4.34912109375, -4.1697998046875, -3.990478515625, -3.8111572265625, -3.6318359375, -3.4525146484375, -3.273193359375, -3.0938720703125, -2.91455078125, -2.7352294921875, -2.555908203125, -2.3765869140625, -2.197265625, -2.0179443359375, -1.838623046875, -1.6593017578125, -1.47998046875, -1.3006591796875, -1.121337890625, -0.9420166015625, -0.7626953125, -0.5833740234375, -0.404052734375, -0.2247314453125, -0.04541015625, 0.1339111328125, 0.313232421875, 0.4925537109375, 0.671875, 0.8511962890625, 1.030517578125, 1.2098388671875, 1.38916015625, 1.5684814453125, 1.747802734375, 1.9271240234375, 2.1064453125, 2.2857666015625, 2.465087890625, 2.6444091796875, 2.82373046875, 3.0030517578125, 3.182373046875, 3.3616943359375, 3.541015625, 3.7203369140625, 3.899658203125, 4.0789794921875, 4.25830078125, 4.4376220703125, 4.616943359375, 4.7962646484375, 4.9755859375, 5.1549072265625, 5.334228515625, 5.5135498046875, 5.69287109375, 5.8721923828125, 6.051513671875, 6.2308349609375, 6.41015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 7.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 8.0, 11.0, 6.0, 17.0, 19.0, 17.0, 29.0, 36.0, 36.0, 24.0, 34.0, 44.0, 54.0, 44.0, 46.0, 54.0, 34.0, 48.0, 46.0, 30.0, 37.0, 42.0, 27.0, 28.0, 33.0, 18.0, 35.0, 16.0, 19.0, 12.0, 16.0, 17.0, 7.0, 9.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006513595581054688, -0.0006301775574684143, -0.0006089955568313599, -0.0005878135561943054, -0.000566631555557251, -0.0005454495549201965, -0.0005242675542831421, -0.0005030855536460876, -0.0004819035530090332, -0.00046072155237197876, -0.0004395395517349243, -0.0004183575510978699, -0.00039717555046081543, -0.000375993549823761, -0.00035481154918670654, -0.0003336295485496521, -0.00031244754791259766, -0.0002912655472755432, -0.00027008354663848877, -0.0002489015460014343, -0.00022771954536437988, -0.00020653754472732544, -0.000185355544090271, -0.00016417354345321655, -0.0001429915428161621, -0.00012180954217910767, -0.00010062754154205322, -7.944554090499878e-05, -5.8263540267944336e-05, -3.708153963088989e-05, -1.589953899383545e-05, 5.282461643218994e-06, 2.6464462280273438e-05, 4.764646291732788e-05, 6.882846355438232e-05, 9.001046419143677e-05, 0.00011119246482849121, 0.00013237446546554565, 0.0001535564661026001, 0.00017473846673965454, 0.00019592046737670898, 0.00021710246801376343, 0.00023828446865081787, 0.0002594664692878723, 0.00028064846992492676, 0.0003018304705619812, 0.00032301247119903564, 0.0003441944718360901, 0.00036537647247314453, 0.000386558473110199, 0.0004077404737472534, 0.00042892247438430786, 0.0004501044750213623, 0.00047128647565841675, 0.0004924684762954712, 0.0005136504769325256, 0.0005348324775695801, 0.0005560144782066345, 0.000577196478843689, 0.0005983784794807434, 0.0006195604801177979, 0.0006407424807548523, 0.0006619244813919067, 0.0006831064820289612, 0.0007042884826660156]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 16.0, 18.0, 21.0, 28.0, 55.0, 98.0, 152.0, 216.0, 342.0, 619.0, 929.0, 1523.0, 2264.0, 3727.0, 5712.0, 8896.0, 13386.0, 20478.0, 30127.0, 42766.0, 58227.0, 75798.0, 92795.0, 105797.0, 110423.0, 105760.0, 94507.0, 77447.0, 59790.0, 44474.0, 31135.0, 21157.0, 14055.0, 9393.0, 5910.0, 3947.0, 2470.0, 1542.0, 967.0, 577.0, 368.0, 245.0, 151.0, 88.0, 64.0, 29.0, 28.0, 18.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.46484375, -5.2916259765625, -5.118408203125, -4.9451904296875, -4.77197265625, -4.5987548828125, -4.425537109375, -4.2523193359375, -4.0791015625, -3.9058837890625, -3.732666015625, -3.5594482421875, -3.38623046875, -3.2130126953125, -3.039794921875, -2.8665771484375, -2.693359375, -2.5201416015625, -2.346923828125, -2.1737060546875, -2.00048828125, -1.8272705078125, -1.654052734375, -1.4808349609375, -1.3076171875, -1.1343994140625, -0.961181640625, -0.7879638671875, -0.61474609375, -0.4415283203125, -0.268310546875, -0.0950927734375, 0.078125, 0.2513427734375, 0.424560546875, 0.5977783203125, 0.77099609375, 0.9442138671875, 1.117431640625, 1.2906494140625, 1.4638671875, 1.6370849609375, 1.810302734375, 1.9835205078125, 2.15673828125, 2.3299560546875, 2.503173828125, 2.6763916015625, 2.849609375, 3.0228271484375, 3.196044921875, 3.3692626953125, 3.54248046875, 3.7156982421875, 3.888916015625, 4.0621337890625, 4.2353515625, 4.4085693359375, 4.581787109375, 4.7550048828125, 4.92822265625, 5.1014404296875, 5.274658203125, 5.4478759765625, 5.62109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 2.0, 9.0, 7.0, 9.0, 18.0, 16.0, 18.0, 19.0, 23.0, 29.0, 26.0, 23.0, 30.0, 34.0, 48.0, 44.0, 38.0, 52.0, 54.0, 55.0, 45.0, 40.0, 51.0, 45.0, 44.0, 34.0, 27.0, 27.0, 17.0, 19.0, 15.0, 19.0, 15.0, 9.0, 11.0, 4.0, 5.0, 8.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5, -2.42596435546875, -2.3519287109375, -2.27789306640625, -2.203857421875, -2.12982177734375, -2.0557861328125, -1.98175048828125, -1.90771484375, -1.83367919921875, -1.7596435546875, -1.68560791015625, -1.611572265625, -1.53753662109375, -1.4635009765625, -1.38946533203125, -1.3154296875, -1.24139404296875, -1.1673583984375, -1.09332275390625, -1.019287109375, -0.94525146484375, -0.8712158203125, -0.79718017578125, -0.72314453125, -0.64910888671875, -0.5750732421875, -0.50103759765625, -0.427001953125, -0.35296630859375, -0.2789306640625, -0.20489501953125, -0.130859375, -0.05682373046875, 0.0172119140625, 0.09124755859375, 0.165283203125, 0.23931884765625, 0.3133544921875, 0.38739013671875, 0.46142578125, 0.53546142578125, 0.6094970703125, 0.68353271484375, 0.757568359375, 0.83160400390625, 0.9056396484375, 0.97967529296875, 1.0537109375, 1.12774658203125, 1.2017822265625, 1.27581787109375, 1.349853515625, 1.42388916015625, 1.4979248046875, 1.57196044921875, 1.64599609375, 1.72003173828125, 1.7940673828125, 1.86810302734375, 1.942138671875, 2.01617431640625, 2.0902099609375, 2.16424560546875, 2.23828125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 7.0, 3.0, 7.0, 9.0, 10.0, 10.0, 14.0, 10.0, 16.0, 29.0, 12.0, 30.0, 24.0, 33.0, 29.0, 26.0, 42.0, 44.0, 50.0, 31.0, 52.0, 42.0, 44.0, 54.0, 35.0, 33.0, 36.0, 30.0, 34.0, 33.0, 22.0, 25.0, 16.0, 18.0, 6.0, 18.0, 12.0, 10.0, 6.0, 5.0, 8.0, 2.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.590803146362305, -19.92736053466797, -19.263916015625, -18.600473403930664, -17.937030792236328, -17.27358627319336, -16.610143661499023, -15.946701049804688, -15.283257484436035, -14.619813919067383, -13.956371307373047, -13.292927742004395, -12.629484176635742, -11.966041564941406, -11.302597999572754, -10.639154434204102, -9.975711822509766, -9.312268257141113, -8.648825645446777, -7.985382080078125, -7.321938991546631, -6.658495903015137, -5.995052337646484, -5.33160924911499, -4.668166160583496, -4.004723072052002, -3.3412797451019287, -2.6778364181518555, -2.0143933296203613, -1.3509502410888672, -0.687506914138794, -0.024063587188720703, 0.6393775939941406, 1.3028208017349243, 1.966264009475708, 2.6297073364257812, 3.2931504249572754, 3.9565935134887695, 4.620037078857422, 5.283480167388916, 5.94692325592041, 6.610366344451904, 7.273809432983398, 7.937252998352051, 8.600696563720703, 9.264139175415039, 9.927582740783691, 10.591026306152344, 11.25446891784668, 11.917912483215332, 12.581355094909668, 13.24479866027832, 13.908241271972656, 14.571684837341309, 15.235128402709961, 15.898571014404297, 16.562015533447266, 17.2254581451416, 17.88890266418457, 18.552345275878906, 19.215787887573242, 19.879230499267578, 20.542675018310547, 21.206117630004883, 21.86956024169922]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 11.0, 6.0, 15.0, 15.0, 9.0, 19.0, 22.0, 24.0, 25.0, 27.0, 39.0, 31.0, 31.0, 40.0, 34.0, 44.0, 38.0, 40.0, 46.0, 36.0, 35.0, 36.0, 39.0, 40.0, 41.0, 25.0, 30.0, 28.0, 21.0, 30.0, 10.0, 19.0, 15.0, 12.0, 9.0, 14.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-27.00551986694336, -26.270401000976562, -25.535280227661133, -24.800161361694336, -24.06504249572754, -23.32992172241211, -22.594802856445312, -21.859683990478516, -21.124563217163086, -20.38944435119629, -19.65432357788086, -18.919204711914062, -18.184085845947266, -17.448965072631836, -16.71384620666504, -15.978726387023926, -15.243607521057129, -14.508487701416016, -13.773368835449219, -13.038249015808105, -12.303129196166992, -11.568010330200195, -10.832890510559082, -10.097770690917969, -9.362651824951172, -8.627532005310059, -7.8924126625061035, -7.157293319702148, -6.422173500061035, -5.68705415725708, -4.951934814453125, -4.216814994812012, -3.4816951751708984, -2.7465755939483643, -2.01145601272583, -1.276336669921875, -0.5412170886993408, 0.19390249252319336, 0.9290218353271484, 1.6641416549682617, 2.399260997772217, 3.134380578994751, 3.869500160217285, 4.60461950302124, 5.339738845825195, 6.074858665466309, 6.809978008270264, 7.545097827911377, 8.280217170715332, 9.015336990356445, 9.750455856323242, 10.485575675964355, 11.220695495605469, 11.955814361572266, 12.690934181213379, 13.426054000854492, 14.161172866821289, 14.896292686462402, 15.6314115524292, 16.366531372070312, 17.10165023803711, 17.83677101135254, 18.571889877319336, 19.307010650634766, 20.042129516601562]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 14.0, 10.0, 20.0, 40.0, 47.0, 92.0, 128.0, 211.0, 269.0, 530.0, 789.0, 1307.0, 2133.0, 3686.0, 6347.0, 11826.0, 21783.0, 41220.0, 79851.0, 156247.0, 298798.0, 521158.0, 748789.0, 809105.0, 641556.0, 398323.0, 215609.0, 110678.0, 57137.0, 29572.0, 16137.0, 8744.0, 5010.0, 2834.0, 1623.0, 1002.0, 566.0, 383.0, 253.0, 146.0, 116.0, 69.0, 43.0, 28.0, 15.0, 11.0, 9.0, 6.0, 5.0, 5.0, 0.0, 1.0], "bins": [-28.5625, -27.751953125, -26.94140625, -26.130859375, -25.3203125, -24.509765625, -23.69921875, -22.888671875, -22.078125, -21.267578125, -20.45703125, -19.646484375, -18.8359375, -18.025390625, -17.21484375, -16.404296875, -15.59375, -14.783203125, -13.97265625, -13.162109375, -12.3515625, -11.541015625, -10.73046875, -9.919921875, -9.109375, -8.298828125, -7.48828125, -6.677734375, -5.8671875, -5.056640625, -4.24609375, -3.435546875, -2.625, -1.814453125, -1.00390625, -0.193359375, 0.6171875, 1.427734375, 2.23828125, 3.048828125, 3.859375, 4.669921875, 5.48046875, 6.291015625, 7.1015625, 7.912109375, 8.72265625, 9.533203125, 10.34375, 11.154296875, 11.96484375, 12.775390625, 13.5859375, 14.396484375, 15.20703125, 16.017578125, 16.828125, 17.638671875, 18.44921875, 19.259765625, 20.0703125, 20.880859375, 21.69140625, 22.501953125, 23.3125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 7.0, 7.0, 5.0, 7.0, 13.0, 12.0, 18.0, 19.0, 23.0, 21.0, 21.0, 22.0, 22.0, 41.0, 44.0, 41.0, 43.0, 36.0, 46.0, 44.0, 36.0, 42.0, 41.0, 26.0, 49.0, 30.0, 29.0, 31.0, 27.0, 26.0, 23.0, 18.0, 23.0, 26.0, 15.0, 12.0, 8.0, 10.0, 5.0, 10.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 2.0], "bins": [-25.609375, -24.91845703125, -24.2275390625, -23.53662109375, -22.845703125, -22.15478515625, -21.4638671875, -20.77294921875, -20.08203125, -19.39111328125, -18.7001953125, -18.00927734375, -17.318359375, -16.62744140625, -15.9365234375, -15.24560546875, -14.5546875, -13.86376953125, -13.1728515625, -12.48193359375, -11.791015625, -11.10009765625, -10.4091796875, -9.71826171875, -9.02734375, -8.33642578125, -7.6455078125, -6.95458984375, -6.263671875, -5.57275390625, -4.8818359375, -4.19091796875, -3.5, -2.80908203125, -2.1181640625, -1.42724609375, -0.736328125, -0.04541015625, 0.6455078125, 1.33642578125, 2.02734375, 2.71826171875, 3.4091796875, 4.10009765625, 4.791015625, 5.48193359375, 6.1728515625, 6.86376953125, 7.5546875, 8.24560546875, 8.9365234375, 9.62744140625, 10.318359375, 11.00927734375, 11.7001953125, 12.39111328125, 13.08203125, 13.77294921875, 14.4638671875, 15.15478515625, 15.845703125, 16.53662109375, 17.2275390625, 17.91845703125, 18.609375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 13.0, 13.0, 25.0, 33.0, 71.0, 90.0, 171.0, 277.0, 459.0, 788.0, 1342.0, 2340.0, 4335.0, 7482.0, 13443.0, 23883.0, 42960.0, 77640.0, 136351.0, 234831.0, 375326.0, 537195.0, 655231.0, 652117.0, 528861.0, 368432.0, 227708.0, 133038.0, 74839.0, 41959.0, 23174.0, 12870.0, 7250.0, 4090.0, 2363.0, 1434.0, 747.0, 447.0, 288.0, 159.0, 83.0, 51.0, 31.0, 17.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.5, -23.6826171875, -22.865234375, -22.0478515625, -21.23046875, -20.4130859375, -19.595703125, -18.7783203125, -17.9609375, -17.1435546875, -16.326171875, -15.5087890625, -14.69140625, -13.8740234375, -13.056640625, -12.2392578125, -11.421875, -10.6044921875, -9.787109375, -8.9697265625, -8.15234375, -7.3349609375, -6.517578125, -5.7001953125, -4.8828125, -4.0654296875, -3.248046875, -2.4306640625, -1.61328125, -0.7958984375, 0.021484375, 0.8388671875, 1.65625, 2.4736328125, 3.291015625, 4.1083984375, 4.92578125, 5.7431640625, 6.560546875, 7.3779296875, 8.1953125, 9.0126953125, 9.830078125, 10.6474609375, 11.46484375, 12.2822265625, 13.099609375, 13.9169921875, 14.734375, 15.5517578125, 16.369140625, 17.1865234375, 18.00390625, 18.8212890625, 19.638671875, 20.4560546875, 21.2734375, 22.0908203125, 22.908203125, 23.7255859375, 24.54296875, 25.3603515625, 26.177734375, 26.9951171875, 27.8125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 9.0, 13.0, 14.0, 22.0, 25.0, 41.0, 47.0, 50.0, 55.0, 59.0, 84.0, 100.0, 103.0, 108.0, 129.0, 147.0, 179.0, 171.0, 182.0, 197.0, 204.0, 187.0, 200.0, 222.0, 197.0, 173.0, 159.0, 144.0, 134.0, 118.0, 112.0, 83.0, 79.0, 53.0, 61.0, 46.0, 33.0, 23.0, 21.0, 16.0, 19.0, 11.0, 6.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.921875, -8.6368408203125, -8.351806640625, -8.0667724609375, -7.78173828125, -7.4967041015625, -7.211669921875, -6.9266357421875, -6.6416015625, -6.3565673828125, -6.071533203125, -5.7864990234375, -5.50146484375, -5.2164306640625, -4.931396484375, -4.6463623046875, -4.361328125, -4.0762939453125, -3.791259765625, -3.5062255859375, -3.22119140625, -2.9361572265625, -2.651123046875, -2.3660888671875, -2.0810546875, -1.7960205078125, -1.510986328125, -1.2259521484375, -0.94091796875, -0.6558837890625, -0.370849609375, -0.0858154296875, 0.19921875, 0.4842529296875, 0.769287109375, 1.0543212890625, 1.33935546875, 1.6243896484375, 1.909423828125, 2.1944580078125, 2.4794921875, 2.7645263671875, 3.049560546875, 3.3345947265625, 3.61962890625, 3.9046630859375, 4.189697265625, 4.4747314453125, 4.759765625, 5.0447998046875, 5.329833984375, 5.6148681640625, 5.89990234375, 6.1849365234375, 6.469970703125, 6.7550048828125, 7.0400390625, 7.3250732421875, 7.610107421875, 7.8951416015625, 8.18017578125, 8.4652099609375, 8.750244140625, 9.0352783203125, 9.3203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 6.0, 3.0, 8.0, 7.0, 4.0, 12.0, 15.0, 15.0, 17.0, 19.0, 24.0, 42.0, 37.0, 46.0, 47.0, 35.0, 54.0, 45.0, 40.0, 40.0, 43.0, 41.0, 50.0, 47.0, 37.0, 31.0, 24.0, 29.0, 25.0, 22.0, 25.0, 17.0, 19.0, 20.0, 10.0, 11.0, 4.0, 8.0, 2.0, 8.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.99365997314453, -27.18751335144043, -26.381364822387695, -25.575218200683594, -24.76906967163086, -23.962923049926758, -23.156776428222656, -22.350627899169922, -21.54448127746582, -20.73833465576172, -19.932186126708984, -19.126039505004883, -18.31989097595215, -17.513744354248047, -16.707595825195312, -15.901449203491211, -15.095301628112793, -14.289154052734375, -13.483006477355957, -12.676858901977539, -11.870712280273438, -11.06456470489502, -10.258417129516602, -9.4522705078125, -8.646121978759766, -7.839974403381348, -7.033827304840088, -6.22767972946167, -5.42153263092041, -4.615385055541992, -3.809237480163574, -3.0030903816223145, -2.1969432830810547, -1.3907959461212158, -0.5846484899520874, 0.22149896621704102, 1.0276463031768799, 1.8337936401367188, 2.6399412155151367, 3.4460883140563965, 4.2522358894348145, 5.058383464813232, 5.864530563354492, 6.67067813873291, 7.476825714111328, 8.28297233581543, 9.089120864868164, 9.895267486572266, 10.701415061950684, 11.507562637329102, 12.31371021270752, 13.119857788085938, 13.926004409790039, 14.732151985168457, 15.538299560546875, 16.344446182250977, 17.15059471130371, 17.956741333007812, 18.762889862060547, 19.56903648376465, 20.375185012817383, 21.181331634521484, 21.98748016357422, 22.79362678527832, 23.599773406982422]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 7.0, 4.0, 14.0, 12.0, 17.0, 22.0, 21.0, 28.0, 27.0, 23.0, 22.0, 30.0, 31.0, 30.0, 40.0, 34.0, 48.0, 29.0, 43.0, 38.0, 46.0, 47.0, 38.0, 43.0, 36.0, 29.0, 41.0, 25.0, 30.0, 21.0, 18.0, 22.0, 14.0, 11.0, 9.0, 8.0, 6.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.282615661621094, -25.497875213623047, -24.713136672973633, -23.928396224975586, -23.14365577697754, -22.358917236328125, -21.574176788330078, -20.78943634033203, -20.004695892333984, -19.219955444335938, -18.435216903686523, -17.650476455688477, -16.86573600769043, -16.080997467041016, -15.296257019042969, -14.511516571044922, -13.726778030395508, -12.942038536071777, -12.15729808807373, -11.37255859375, -10.587818145751953, -9.803078651428223, -9.018339157104492, -8.233598709106445, -7.448859214782715, -6.664119243621826, -5.8793792724609375, -5.094639778137207, -4.309899806976318, -3.5251598358154297, -2.740420341491699, -1.9556803703308105, -1.1709403991699219, -0.38620054721832275, 0.39853930473327637, 1.183279037475586, 1.9680190086364746, 2.7527589797973633, 3.5374984741210938, 4.322238445281982, 5.106978416442871, 5.89171838760376, 6.676458358764648, 7.461197853088379, 8.24593734741211, 9.030677795410156, 9.815417289733887, 10.600156784057617, 11.384897232055664, 12.169636726379395, 12.954377174377441, 13.739116668701172, 14.523857116699219, 15.30859661102295, 16.09333610534668, 16.878076553344727, 17.66281509399414, 18.447555541992188, 19.2322940826416, 20.01703453063965, 20.801774978637695, 21.58651351928711, 22.371253967285156, 23.155994415283203, 23.94073486328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 9.0, 24.0, 24.0, 42.0, 42.0, 58.0, 110.0, 170.0, 234.0, 367.0, 489.0, 813.0, 1267.0, 1933.0, 3086.0, 5074.0, 8365.0, 13275.0, 21123.0, 33835.0, 52420.0, 76324.0, 104311.0, 127190.0, 136386.0, 127937.0, 105800.0, 78800.0, 54103.0, 35460.0, 22378.0, 13925.0, 8509.0, 5440.0, 3348.0, 2101.0, 1303.0, 815.0, 564.0, 360.0, 244.0, 146.0, 111.0, 79.0, 45.0, 39.0, 23.0, 15.0, 12.0, 5.0, 10.0, 7.0, 1.0, 0.0, 1.0], "bins": [-13.3984375, -12.9990234375, -12.599609375, -12.2001953125, -11.80078125, -11.4013671875, -11.001953125, -10.6025390625, -10.203125, -9.8037109375, -9.404296875, -9.0048828125, -8.60546875, -8.2060546875, -7.806640625, -7.4072265625, -7.0078125, -6.6083984375, -6.208984375, -5.8095703125, -5.41015625, -5.0107421875, -4.611328125, -4.2119140625, -3.8125, -3.4130859375, -3.013671875, -2.6142578125, -2.21484375, -1.8154296875, -1.416015625, -1.0166015625, -0.6171875, -0.2177734375, 0.181640625, 0.5810546875, 0.98046875, 1.3798828125, 1.779296875, 2.1787109375, 2.578125, 2.9775390625, 3.376953125, 3.7763671875, 4.17578125, 4.5751953125, 4.974609375, 5.3740234375, 5.7734375, 6.1728515625, 6.572265625, 6.9716796875, 7.37109375, 7.7705078125, 8.169921875, 8.5693359375, 8.96875, 9.3681640625, 9.767578125, 10.1669921875, 10.56640625, 10.9658203125, 11.365234375, 11.7646484375, 12.1640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 2.0, 4.0, 7.0, 10.0, 10.0, 8.0, 13.0, 16.0, 20.0, 20.0, 28.0, 24.0, 27.0, 39.0, 26.0, 30.0, 28.0, 33.0, 39.0, 46.0, 42.0, 36.0, 43.0, 49.0, 48.0, 46.0, 33.0, 35.0, 21.0, 33.0, 20.0, 26.0, 24.0, 27.0, 16.0, 16.0, 13.0, 7.0, 6.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-28.484375, -27.66845703125, -26.8525390625, -26.03662109375, -25.220703125, -24.40478515625, -23.5888671875, -22.77294921875, -21.95703125, -21.14111328125, -20.3251953125, -19.50927734375, -18.693359375, -17.87744140625, -17.0615234375, -16.24560546875, -15.4296875, -14.61376953125, -13.7978515625, -12.98193359375, -12.166015625, -11.35009765625, -10.5341796875, -9.71826171875, -8.90234375, -8.08642578125, -7.2705078125, -6.45458984375, -5.638671875, -4.82275390625, -4.0068359375, -3.19091796875, -2.375, -1.55908203125, -0.7431640625, 0.07275390625, 0.888671875, 1.70458984375, 2.5205078125, 3.33642578125, 4.15234375, 4.96826171875, 5.7841796875, 6.60009765625, 7.416015625, 8.23193359375, 9.0478515625, 9.86376953125, 10.6796875, 11.49560546875, 12.3115234375, 13.12744140625, 13.943359375, 14.75927734375, 15.5751953125, 16.39111328125, 17.20703125, 18.02294921875, 18.8388671875, 19.65478515625, 20.470703125, 21.28662109375, 22.1025390625, 22.91845703125, 23.734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 3.0, 6.0, 10.0, 13.0, 16.0, 28.0, 38.0, 68.0, 85.0, 142.0, 190.0, 312.0, 488.0, 833.0, 1290.0, 2261.0, 3908.0, 7212.0, 13401.0, 25124.0, 47375.0, 87754.0, 148690.0, 203232.0, 197630.0, 137954.0, 78929.0, 42149.0, 22359.0, 11772.0, 6454.0, 3568.0, 1998.0, 1176.0, 738.0, 444.0, 265.0, 229.0, 120.0, 95.0, 55.0, 41.0, 23.0, 21.0, 17.0, 10.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.375, -24.60400390625, -23.8330078125, -23.06201171875, -22.291015625, -21.52001953125, -20.7490234375, -19.97802734375, -19.20703125, -18.43603515625, -17.6650390625, -16.89404296875, -16.123046875, -15.35205078125, -14.5810546875, -13.81005859375, -13.0390625, -12.26806640625, -11.4970703125, -10.72607421875, -9.955078125, -9.18408203125, -8.4130859375, -7.64208984375, -6.87109375, -6.10009765625, -5.3291015625, -4.55810546875, -3.787109375, -3.01611328125, -2.2451171875, -1.47412109375, -0.703125, 0.06787109375, 0.8388671875, 1.60986328125, 2.380859375, 3.15185546875, 3.9228515625, 4.69384765625, 5.46484375, 6.23583984375, 7.0068359375, 7.77783203125, 8.548828125, 9.31982421875, 10.0908203125, 10.86181640625, 11.6328125, 12.40380859375, 13.1748046875, 13.94580078125, 14.716796875, 15.48779296875, 16.2587890625, 17.02978515625, 17.80078125, 18.57177734375, 19.3427734375, 20.11376953125, 20.884765625, 21.65576171875, 22.4267578125, 23.19775390625, 23.96875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 8.0, 8.0, 8.0, 7.0, 15.0, 16.0, 28.0, 29.0, 19.0, 34.0, 33.0, 35.0, 39.0, 39.0, 49.0, 30.0, 46.0, 32.0, 49.0, 41.0, 48.0, 51.0, 34.0, 41.0, 23.0, 37.0, 27.0, 25.0, 29.0, 13.0, 19.0, 14.0, 15.0, 7.0, 13.0, 10.0, 11.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.609375, -16.060302734375, -15.51123046875, -14.962158203125, -14.4130859375, -13.864013671875, -13.31494140625, -12.765869140625, -12.216796875, -11.667724609375, -11.11865234375, -10.569580078125, -10.0205078125, -9.471435546875, -8.92236328125, -8.373291015625, -7.82421875, -7.275146484375, -6.72607421875, -6.177001953125, -5.6279296875, -5.078857421875, -4.52978515625, -3.980712890625, -3.431640625, -2.882568359375, -2.33349609375, -1.784423828125, -1.2353515625, -0.686279296875, -0.13720703125, 0.411865234375, 0.9609375, 1.510009765625, 2.05908203125, 2.608154296875, 3.1572265625, 3.706298828125, 4.25537109375, 4.804443359375, 5.353515625, 5.902587890625, 6.45166015625, 7.000732421875, 7.5498046875, 8.098876953125, 8.64794921875, 9.197021484375, 9.74609375, 10.295166015625, 10.84423828125, 11.393310546875, 11.9423828125, 12.491455078125, 13.04052734375, 13.589599609375, 14.138671875, 14.687744140625, 15.23681640625, 15.785888671875, 16.3349609375, 16.884033203125, 17.43310546875, 17.982177734375, 18.53125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 9.0, 11.0, 10.0, 20.0, 27.0, 34.0, 62.0, 86.0, 130.0, 183.0, 231.0, 395.0, 619.0, 1006.0, 1840.0, 3099.0, 6069.0, 12690.0, 27234.0, 59602.0, 121533.0, 207617.0, 243011.0, 178878.0, 96526.0, 45742.0, 20750.0, 9780.0, 4882.0, 2525.0, 1404.0, 832.0, 540.0, 360.0, 220.0, 161.0, 101.0, 89.0, 54.0, 46.0, 29.0, 30.0, 19.0, 13.0, 14.0, 6.0, 8.0, 7.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-11.9453125, -11.5869140625, -11.228515625, -10.8701171875, -10.51171875, -10.1533203125, -9.794921875, -9.4365234375, -9.078125, -8.7197265625, -8.361328125, -8.0029296875, -7.64453125, -7.2861328125, -6.927734375, -6.5693359375, -6.2109375, -5.8525390625, -5.494140625, -5.1357421875, -4.77734375, -4.4189453125, -4.060546875, -3.7021484375, -3.34375, -2.9853515625, -2.626953125, -2.2685546875, -1.91015625, -1.5517578125, -1.193359375, -0.8349609375, -0.4765625, -0.1181640625, 0.240234375, 0.5986328125, 0.95703125, 1.3154296875, 1.673828125, 2.0322265625, 2.390625, 2.7490234375, 3.107421875, 3.4658203125, 3.82421875, 4.1826171875, 4.541015625, 4.8994140625, 5.2578125, 5.6162109375, 5.974609375, 6.3330078125, 6.69140625, 7.0498046875, 7.408203125, 7.7666015625, 8.125, 8.4833984375, 8.841796875, 9.2001953125, 9.55859375, 9.9169921875, 10.275390625, 10.6337890625, 10.9921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 16.0, 22.0, 29.0, 44.0, 43.0, 57.0, 52.0, 55.0, 52.0, 66.0, 68.0, 62.0, 68.0, 62.0, 59.0, 50.0, 34.0, 28.0, 27.0, 19.0, 15.0, 15.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005707740783691406, -0.0005525946617126465, -0.0005344152450561523, -0.0005162358283996582, -0.0004980564117431641, -0.0004798769950866699, -0.0004616975784301758, -0.00044351816177368164, -0.0004253387451171875, -0.00040715932846069336, -0.0003889799118041992, -0.0003708004951477051, -0.00035262107849121094, -0.0003344416618347168, -0.00031626224517822266, -0.0002980828285217285, -0.0002799034118652344, -0.00026172399520874023, -0.0002435445785522461, -0.00022536516189575195, -0.0002071857452392578, -0.00018900632858276367, -0.00017082691192626953, -0.0001526474952697754, -0.00013446807861328125, -0.00011628866195678711, -9.810924530029297e-05, -7.992982864379883e-05, -6.175041198730469e-05, -4.357099533081055e-05, -2.5391578674316406e-05, -7.212162017822266e-06, 1.0967254638671875e-05, 2.9146671295166016e-05, 4.7326087951660156e-05, 6.55055046081543e-05, 8.368492126464844e-05, 0.00010186433792114258, 0.00012004375457763672, 0.00013822317123413086, 0.000156402587890625, 0.00017458200454711914, 0.00019276142120361328, 0.00021094083786010742, 0.00022912025451660156, 0.0002472996711730957, 0.00026547908782958984, 0.000283658504486084, 0.0003018379211425781, 0.00032001733779907227, 0.0003381967544555664, 0.00035637617111206055, 0.0003745555877685547, 0.00039273500442504883, 0.00041091442108154297, 0.0004290938377380371, 0.00044727325439453125, 0.0004654526710510254, 0.00048363208770751953, 0.0005018115043640137, 0.0005199909210205078, 0.000538170337677002, 0.0005563497543334961, 0.0005745291709899902, 0.0005927085876464844]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 6.0, 8.0, 17.0, 15.0, 21.0, 27.0, 37.0, 65.0, 97.0, 111.0, 181.0, 286.0, 495.0, 782.0, 1436.0, 2784.0, 6036.0, 13986.0, 35078.0, 85025.0, 179470.0, 265619.0, 232787.0, 128516.0, 55467.0, 22312.0, 9052.0, 4180.0, 1940.0, 1036.0, 566.0, 334.0, 233.0, 160.0, 109.0, 90.0, 48.0, 34.0, 28.0, 21.0, 10.0, 11.0, 7.0, 6.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.764892578125, -14.23291015625, -13.700927734375, -13.1689453125, -12.636962890625, -12.10498046875, -11.572998046875, -11.041015625, -10.509033203125, -9.97705078125, -9.445068359375, -8.9130859375, -8.381103515625, -7.84912109375, -7.317138671875, -6.78515625, -6.253173828125, -5.72119140625, -5.189208984375, -4.6572265625, -4.125244140625, -3.59326171875, -3.061279296875, -2.529296875, -1.997314453125, -1.46533203125, -0.933349609375, -0.4013671875, 0.130615234375, 0.66259765625, 1.194580078125, 1.7265625, 2.258544921875, 2.79052734375, 3.322509765625, 3.8544921875, 4.386474609375, 4.91845703125, 5.450439453125, 5.982421875, 6.514404296875, 7.04638671875, 7.578369140625, 8.1103515625, 8.642333984375, 9.17431640625, 9.706298828125, 10.23828125, 10.770263671875, 11.30224609375, 11.834228515625, 12.3662109375, 12.898193359375, 13.43017578125, 13.962158203125, 14.494140625, 15.026123046875, 15.55810546875, 16.090087890625, 16.6220703125, 17.154052734375, 17.68603515625, 18.218017578125, 18.75]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 10.0, 10.0, 15.0, 12.0, 19.0, 24.0, 30.0, 26.0, 48.0, 55.0, 67.0, 71.0, 66.0, 71.0, 70.0, 74.0, 54.0, 57.0, 49.0, 36.0, 30.0, 28.0, 24.0, 19.0, 6.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.069580078125, -3.90478515625, -3.739990234375, -3.5751953125, -3.410400390625, -3.24560546875, -3.080810546875, -2.916015625, -2.751220703125, -2.58642578125, -2.421630859375, -2.2568359375, -2.092041015625, -1.92724609375, -1.762451171875, -1.59765625, -1.432861328125, -1.26806640625, -1.103271484375, -0.9384765625, -0.773681640625, -0.60888671875, -0.444091796875, -0.279296875, -0.114501953125, 0.05029296875, 0.215087890625, 0.3798828125, 0.544677734375, 0.70947265625, 0.874267578125, 1.0390625, 1.203857421875, 1.36865234375, 1.533447265625, 1.6982421875, 1.863037109375, 2.02783203125, 2.192626953125, 2.357421875, 2.522216796875, 2.68701171875, 2.851806640625, 3.0166015625, 3.181396484375, 3.34619140625, 3.510986328125, 3.67578125, 3.840576171875, 4.00537109375, 4.170166015625, 4.3349609375, 4.499755859375, 4.66455078125, 4.829345703125, 4.994140625, 5.158935546875, 5.32373046875, 5.488525390625, 5.6533203125, 5.818115234375, 5.98291015625, 6.147705078125, 6.3125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 5.0, 4.0, 6.0, 3.0, 9.0, 5.0, 11.0, 11.0, 13.0, 14.0, 19.0, 27.0, 24.0, 38.0, 31.0, 42.0, 42.0, 37.0, 43.0, 51.0, 37.0, 45.0, 45.0, 50.0, 47.0, 27.0, 36.0, 40.0, 23.0, 37.0, 17.0, 28.0, 24.0, 18.0, 13.0, 18.0, 14.0, 9.0, 15.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.167091369628906, -25.39385414123535, -24.62061882019043, -23.847381591796875, -23.074146270751953, -22.3009090423584, -21.527673721313477, -20.754436492919922, -19.981201171875, -19.207963943481445, -18.434728622436523, -17.66149139404297, -16.888256072998047, -16.115018844604492, -15.34178352355957, -14.568546295166016, -13.795310020446777, -13.022073745727539, -12.2488374710083, -11.475601196289062, -10.702364921569824, -9.929128646850586, -9.155891418457031, -8.38265609741211, -7.609419345855713, -6.836183071136475, -6.062946796417236, -5.28971004486084, -4.516473770141602, -3.7432377338409424, -2.970001220703125, -2.1967649459838867, -1.4235286712646484, -0.6502923369407654, 0.12294399738311768, 0.8961803913116455, 1.6694166660308838, 2.442652940750122, 3.2158894538879395, 3.9891257286071777, 4.762362003326416, 5.535598278045654, 6.308834552764893, 7.082071304321289, 7.855307579040527, 8.628543853759766, 9.401780128479004, 10.175016403198242, 10.94825267791748, 11.721488952636719, 12.494725227355957, 13.267961502075195, 14.041197776794434, 14.814434051513672, 15.587671279907227, 16.36090660095215, 17.134143829345703, 17.907381057739258, 18.68061637878418, 19.453853607177734, 20.227088928222656, 21.00032615661621, 21.773561477661133, 22.546798706054688, 23.32003402709961]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 8.0, 7.0, 7.0, 10.0, 16.0, 14.0, 15.0, 23.0, 20.0, 23.0, 30.0, 28.0, 28.0, 31.0, 31.0, 38.0, 45.0, 38.0, 32.0, 43.0, 41.0, 40.0, 40.0, 49.0, 37.0, 40.0, 41.0, 32.0, 33.0, 25.0, 20.0, 24.0, 17.0, 17.0, 9.0, 8.0, 11.0, 7.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-26.76115608215332, -25.968358993530273, -25.175559997558594, -24.382762908935547, -23.5899658203125, -22.79716682434082, -22.004369735717773, -21.211570739746094, -20.418773651123047, -19.6259765625, -18.83317756652832, -18.040380477905273, -17.247583389282227, -16.454784393310547, -15.6619873046875, -14.869189262390137, -14.07639217376709, -13.283594131469727, -12.49079704284668, -11.697999000549316, -10.905200958251953, -10.112403869628906, -9.319605827331543, -8.52680778503418, -7.734010219573975, -6.9412126541137695, -6.148414611816406, -5.355617046356201, -4.562819480895996, -3.770021438598633, -2.9772238731384277, -2.1844258308410645, -1.3916282653808594, -0.59883052110672, 0.19396722316741943, 0.9867649078369141, 1.7795627117156982, 2.5723605155944824, 3.3651580810546875, 4.157956123352051, 4.950753688812256, 5.743551254272461, 6.536349296569824, 7.329146862030029, 8.121944427490234, 8.914742469787598, 9.707540512084961, 10.500337600708008, 11.293135643005371, 12.085933685302734, 12.878730773925781, 13.671528816223145, 14.464326858520508, 15.257123947143555, 16.049922943115234, 16.84272003173828, 17.635517120361328, 18.428314208984375, 19.221113204956055, 20.0139102935791, 20.80670738220215, 21.599506378173828, 22.392303466796875, 23.185100555419922, 23.9778995513916]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 14.0, 17.0, 29.0, 56.0, 95.0, 176.0, 232.0, 364.0, 582.0, 928.0, 1379.0, 2169.0, 3466.0, 5365.0, 8122.0, 12753.0, 19295.0, 28341.0, 40491.0, 56435.0, 73880.0, 90355.0, 104036.0, 109316.0, 106855.0, 96702.0, 80628.0, 62678.0, 46290.0, 32736.0, 22349.0, 14970.0, 9874.0, 6337.0, 4069.0, 2589.0, 1674.0, 1089.0, 664.0, 420.0, 258.0, 184.0, 113.0, 60.0, 42.0, 24.0, 26.0, 7.0, 12.0, 6.0, 1.0, 4.0, 1.0, 1.0], "bins": [-15.9296875, -15.4569091796875, -14.984130859375, -14.5113525390625, -14.03857421875, -13.5657958984375, -13.093017578125, -12.6202392578125, -12.1474609375, -11.6746826171875, -11.201904296875, -10.7291259765625, -10.25634765625, -9.7835693359375, -9.310791015625, -8.8380126953125, -8.365234375, -7.8924560546875, -7.419677734375, -6.9468994140625, -6.47412109375, -6.0013427734375, -5.528564453125, -5.0557861328125, -4.5830078125, -4.1102294921875, -3.637451171875, -3.1646728515625, -2.69189453125, -2.2191162109375, -1.746337890625, -1.2735595703125, -0.80078125, -0.3280029296875, 0.144775390625, 0.6175537109375, 1.09033203125, 1.5631103515625, 2.035888671875, 2.5086669921875, 2.9814453125, 3.4542236328125, 3.927001953125, 4.3997802734375, 4.87255859375, 5.3453369140625, 5.818115234375, 6.2908935546875, 6.763671875, 7.2364501953125, 7.709228515625, 8.1820068359375, 8.65478515625, 9.1275634765625, 9.600341796875, 10.0731201171875, 10.5458984375, 11.0186767578125, 11.491455078125, 11.9642333984375, 12.43701171875, 12.9097900390625, 13.382568359375, 13.8553466796875, 14.328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 4.0, 7.0, 7.0, 11.0, 12.0, 22.0, 19.0, 24.0, 28.0, 29.0, 21.0, 29.0, 34.0, 36.0, 30.0, 39.0, 29.0, 40.0, 44.0, 42.0, 30.0, 40.0, 43.0, 52.0, 50.0, 30.0, 32.0, 26.0, 28.0, 23.0, 32.0, 14.0, 12.0, 13.0, 9.0, 14.0, 4.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0], "bins": [-27.609375, -26.84326171875, -26.0771484375, -25.31103515625, -24.544921875, -23.77880859375, -23.0126953125, -22.24658203125, -21.48046875, -20.71435546875, -19.9482421875, -19.18212890625, -18.416015625, -17.64990234375, -16.8837890625, -16.11767578125, -15.3515625, -14.58544921875, -13.8193359375, -13.05322265625, -12.287109375, -11.52099609375, -10.7548828125, -9.98876953125, -9.22265625, -8.45654296875, -7.6904296875, -6.92431640625, -6.158203125, -5.39208984375, -4.6259765625, -3.85986328125, -3.09375, -2.32763671875, -1.5615234375, -0.79541015625, -0.029296875, 0.73681640625, 1.5029296875, 2.26904296875, 3.03515625, 3.80126953125, 4.5673828125, 5.33349609375, 6.099609375, 6.86572265625, 7.6318359375, 8.39794921875, 9.1640625, 9.93017578125, 10.6962890625, 11.46240234375, 12.228515625, 12.99462890625, 13.7607421875, 14.52685546875, 15.29296875, 16.05908203125, 16.8251953125, 17.59130859375, 18.357421875, 19.12353515625, 19.8896484375, 20.65576171875, 21.421875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 10.0, 7.0, 11.0, 21.0, 38.0, 58.0, 63.0, 97.0, 136.0, 247.0, 406.0, 589.0, 959.0, 1435.0, 2199.0, 3262.0, 5001.0, 7482.0, 10989.0, 16615.0, 23658.0, 33595.0, 45404.0, 59843.0, 75083.0, 88748.0, 99304.0, 101935.0, 98326.0, 88346.0, 74747.0, 59450.0, 45487.0, 32779.0, 23120.0, 16306.0, 11062.0, 7514.0, 4922.0, 3277.0, 2014.0, 1389.0, 928.0, 573.0, 388.0, 259.0, 170.0, 131.0, 63.0, 42.0, 26.0, 11.0, 15.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0], "bins": [-16.265625, -15.764892578125, -15.26416015625, -14.763427734375, -14.2626953125, -13.761962890625, -13.26123046875, -12.760498046875, -12.259765625, -11.759033203125, -11.25830078125, -10.757568359375, -10.2568359375, -9.756103515625, -9.25537109375, -8.754638671875, -8.25390625, -7.753173828125, -7.25244140625, -6.751708984375, -6.2509765625, -5.750244140625, -5.24951171875, -4.748779296875, -4.248046875, -3.747314453125, -3.24658203125, -2.745849609375, -2.2451171875, -1.744384765625, -1.24365234375, -0.742919921875, -0.2421875, 0.258544921875, 0.75927734375, 1.260009765625, 1.7607421875, 2.261474609375, 2.76220703125, 3.262939453125, 3.763671875, 4.264404296875, 4.76513671875, 5.265869140625, 5.7666015625, 6.267333984375, 6.76806640625, 7.268798828125, 7.76953125, 8.270263671875, 8.77099609375, 9.271728515625, 9.7724609375, 10.273193359375, 10.77392578125, 11.274658203125, 11.775390625, 12.276123046875, 12.77685546875, 13.277587890625, 13.7783203125, 14.279052734375, 14.77978515625, 15.280517578125, 15.78125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 21.0, 16.0, 24.0, 19.0, 27.0, 24.0, 40.0, 38.0, 48.0, 38.0, 48.0, 46.0, 38.0, 58.0, 50.0, 53.0, 42.0, 44.0, 45.0, 46.0, 32.0, 22.0, 29.0, 17.0, 25.0, 15.0, 17.0, 11.0, 10.0, 10.0, 3.0, 6.0, 10.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.077392578125, -16.46728515625, -15.857177734375, -15.2470703125, -14.636962890625, -14.02685546875, -13.416748046875, -12.806640625, -12.196533203125, -11.58642578125, -10.976318359375, -10.3662109375, -9.756103515625, -9.14599609375, -8.535888671875, -7.92578125, -7.315673828125, -6.70556640625, -6.095458984375, -5.4853515625, -4.875244140625, -4.26513671875, -3.655029296875, -3.044921875, -2.434814453125, -1.82470703125, -1.214599609375, -0.6044921875, 0.005615234375, 0.61572265625, 1.225830078125, 1.8359375, 2.446044921875, 3.05615234375, 3.666259765625, 4.2763671875, 4.886474609375, 5.49658203125, 6.106689453125, 6.716796875, 7.326904296875, 7.93701171875, 8.547119140625, 9.1572265625, 9.767333984375, 10.37744140625, 10.987548828125, 11.59765625, 12.207763671875, 12.81787109375, 13.427978515625, 14.0380859375, 14.648193359375, 15.25830078125, 15.868408203125, 16.478515625, 17.088623046875, 17.69873046875, 18.308837890625, 18.9189453125, 19.529052734375, 20.13916015625, 20.749267578125, 21.359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 10.0, 22.0, 23.0, 31.0, 42.0, 79.0, 109.0, 170.0, 271.0, 392.0, 647.0, 979.0, 1663.0, 2726.0, 4753.0, 8136.0, 13809.0, 24188.0, 41177.0, 66845.0, 101558.0, 137965.0, 158019.0, 150663.0, 120611.0, 84273.0, 52846.0, 31834.0, 18514.0, 10666.0, 6214.0, 3748.0, 2045.0, 1279.0, 821.0, 462.0, 340.0, 201.0, 148.0, 99.0, 58.0, 44.0, 24.0, 18.0, 12.0, 14.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.1875, -10.8560791015625, -10.524658203125, -10.1932373046875, -9.86181640625, -9.5303955078125, -9.198974609375, -8.8675537109375, -8.5361328125, -8.2047119140625, -7.873291015625, -7.5418701171875, -7.21044921875, -6.8790283203125, -6.547607421875, -6.2161865234375, -5.884765625, -5.5533447265625, -5.221923828125, -4.8905029296875, -4.55908203125, -4.2276611328125, -3.896240234375, -3.5648193359375, -3.2333984375, -2.9019775390625, -2.570556640625, -2.2391357421875, -1.90771484375, -1.5762939453125, -1.244873046875, -0.9134521484375, -0.58203125, -0.2506103515625, 0.080810546875, 0.4122314453125, 0.74365234375, 1.0750732421875, 1.406494140625, 1.7379150390625, 2.0693359375, 2.4007568359375, 2.732177734375, 3.0635986328125, 3.39501953125, 3.7264404296875, 4.057861328125, 4.3892822265625, 4.720703125, 5.0521240234375, 5.383544921875, 5.7149658203125, 6.04638671875, 6.3778076171875, 6.709228515625, 7.0406494140625, 7.3720703125, 7.7034912109375, 8.034912109375, 8.3663330078125, 8.69775390625, 9.0291748046875, 9.360595703125, 9.6920166015625, 10.0234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 1.0, 8.0, 12.0, 16.0, 22.0, 23.0, 27.0, 42.0, 59.0, 52.0, 76.0, 72.0, 82.0, 73.0, 97.0, 57.0, 60.0, 60.0, 38.0, 40.0, 20.0, 17.0, 17.0, 6.0, 8.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013017654418945312, -0.001253172755241394, -0.0012045800685882568, -0.0011559873819351196, -0.0011073946952819824, -0.0010588020086288452, -0.001010209321975708, -0.0009616166353225708, -0.0009130239486694336, -0.0008644312620162964, -0.0008158385753631592, -0.000767245888710022, -0.0007186532020568848, -0.0006700605154037476, -0.0006214678287506104, -0.0005728751420974731, -0.0005242824554443359, -0.00047568976879119873, -0.0004270970821380615, -0.0003785043954849243, -0.0003299117088317871, -0.0002813190221786499, -0.0002327263355255127, -0.0001841336488723755, -0.00013554096221923828, -8.694827556610107e-05, -3.835558891296387e-05, 1.023709774017334e-05, 5.882978439331055e-05, 0.00010742247104644775, 0.00015601515769958496, 0.00020460784435272217, 0.0002532005310058594, 0.0003017932176589966, 0.0003503859043121338, 0.000398978590965271, 0.0004475712776184082, 0.0004961639642715454, 0.0005447566509246826, 0.0005933493375778198, 0.000641942024230957, 0.0006905347108840942, 0.0007391273975372314, 0.0007877200841903687, 0.0008363127708435059, 0.0008849054574966431, 0.0009334981441497803, 0.0009820908308029175, 0.0010306835174560547, 0.001079276204109192, 0.001127868890762329, 0.0011764615774154663, 0.0012250542640686035, 0.0012736469507217407, 0.001322239637374878, 0.0013708323240280151, 0.0014194250106811523, 0.0014680176973342896, 0.0015166103839874268, 0.001565203070640564, 0.0016137957572937012, 0.0016623884439468384, 0.0017109811305999756, 0.0017595738172531128, 0.00180816650390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 9.0, 8.0, 15.0, 20.0, 44.0, 41.0, 80.0, 112.0, 159.0, 224.0, 355.0, 580.0, 963.0, 1525.0, 2496.0, 4062.0, 6760.0, 11373.0, 18433.0, 30445.0, 48094.0, 72901.0, 102180.0, 129142.0, 142881.0, 135274.0, 111461.0, 82203.0, 55437.0, 35822.0, 21724.0, 13146.0, 8061.0, 4922.0, 2877.0, 1712.0, 1086.0, 668.0, 447.0, 276.0, 177.0, 122.0, 88.0, 47.0, 32.0, 28.0, 19.0, 14.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3984375, -9.0919189453125, -8.785400390625, -8.4788818359375, -8.17236328125, -7.8658447265625, -7.559326171875, -7.2528076171875, -6.9462890625, -6.6397705078125, -6.333251953125, -6.0267333984375, -5.72021484375, -5.4136962890625, -5.107177734375, -4.8006591796875, -4.494140625, -4.1876220703125, -3.881103515625, -3.5745849609375, -3.26806640625, -2.9615478515625, -2.655029296875, -2.3485107421875, -2.0419921875, -1.7354736328125, -1.428955078125, -1.1224365234375, -0.81591796875, -0.5093994140625, -0.202880859375, 0.1036376953125, 0.41015625, 0.7166748046875, 1.023193359375, 1.3297119140625, 1.63623046875, 1.9427490234375, 2.249267578125, 2.5557861328125, 2.8623046875, 3.1688232421875, 3.475341796875, 3.7818603515625, 4.08837890625, 4.3948974609375, 4.701416015625, 5.0079345703125, 5.314453125, 5.6209716796875, 5.927490234375, 6.2340087890625, 6.54052734375, 6.8470458984375, 7.153564453125, 7.4600830078125, 7.7666015625, 8.0731201171875, 8.379638671875, 8.6861572265625, 8.99267578125, 9.2991943359375, 9.605712890625, 9.9122314453125, 10.21875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 8.0, 15.0, 16.0, 18.0, 26.0, 34.0, 30.0, 26.0, 42.0, 47.0, 40.0, 47.0, 49.0, 62.0, 60.0, 54.0, 50.0, 47.0, 49.0, 45.0, 42.0, 35.0, 19.0, 20.0, 24.0, 10.0, 12.0, 7.0, 6.0, 6.0, 3.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.85546875, -3.734588623046875, -3.61370849609375, -3.492828369140625, -3.3719482421875, -3.251068115234375, -3.13018798828125, -3.009307861328125, -2.888427734375, -2.767547607421875, -2.64666748046875, -2.525787353515625, -2.4049072265625, -2.284027099609375, -2.16314697265625, -2.042266845703125, -1.92138671875, -1.800506591796875, -1.67962646484375, -1.558746337890625, -1.4378662109375, -1.316986083984375, -1.19610595703125, -1.075225830078125, -0.954345703125, -0.833465576171875, -0.71258544921875, -0.591705322265625, -0.4708251953125, -0.349945068359375, -0.22906494140625, -0.108184814453125, 0.0126953125, 0.133575439453125, 0.25445556640625, 0.375335693359375, 0.4962158203125, 0.617095947265625, 0.73797607421875, 0.858856201171875, 0.979736328125, 1.100616455078125, 1.22149658203125, 1.342376708984375, 1.4632568359375, 1.584136962890625, 1.70501708984375, 1.825897216796875, 1.94677734375, 2.067657470703125, 2.18853759765625, 2.309417724609375, 2.4302978515625, 2.551177978515625, 2.67205810546875, 2.792938232421875, 2.913818359375, 3.034698486328125, 3.15557861328125, 3.276458740234375, 3.3973388671875, 3.518218994140625, 3.63909912109375, 3.759979248046875, 3.880859375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 0.0, 4.0, 5.0, 11.0, 9.0, 10.0, 9.0, 12.0, 12.0, 15.0, 23.0, 27.0, 20.0, 26.0, 37.0, 36.0, 36.0, 50.0, 32.0, 59.0, 46.0, 44.0, 56.0, 41.0, 44.0, 31.0, 31.0, 26.0, 35.0, 19.0, 31.0, 28.0, 26.0, 18.0, 15.0, 15.0, 18.0, 3.0, 14.0, 6.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-28.57404899597168, -27.79125213623047, -27.008453369140625, -26.22565460205078, -25.44285774230957, -24.66006088256836, -23.877262115478516, -23.094463348388672, -22.31166648864746, -21.52886962890625, -20.746070861816406, -19.963272094726562, -19.18047523498535, -18.39767837524414, -17.614879608154297, -16.832080841064453, -16.049283981323242, -15.266486167907715, -14.483688354492188, -13.70089054107666, -12.918092727661133, -12.135294914245605, -11.352497100830078, -10.56969928741455, -9.786901473999023, -9.004103660583496, -8.221305847167969, -7.438508033752441, -6.655710220336914, -5.872912406921387, -5.090114593505859, -4.307316780090332, -3.5245189666748047, -2.7417211532592773, -1.95892333984375, -1.1761255264282227, -0.3933277130126953, 0.38947010040283203, 1.1722679138183594, 1.9550657272338867, 2.737863540649414, 3.5206613540649414, 4.303459167480469, 5.086256980895996, 5.869054794311523, 6.651852607727051, 7.434650421142578, 8.217448234558105, 9.000246047973633, 9.78304386138916, 10.565841674804688, 11.348639488220215, 12.131437301635742, 12.91423511505127, 13.697032928466797, 14.479830741882324, 15.262628555297852, 16.045425415039062, 16.828224182128906, 17.61102294921875, 18.39381980895996, 19.176616668701172, 19.959415435791016, 20.74221420288086, 21.52501106262207]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 6.0, 12.0, 9.0, 13.0, 16.0, 20.0, 18.0, 32.0, 27.0, 31.0, 29.0, 35.0, 35.0, 40.0, 49.0, 34.0, 42.0, 47.0, 54.0, 41.0, 49.0, 45.0, 36.0, 29.0, 38.0, 30.0, 26.0, 24.0, 22.0, 12.0, 19.0, 15.0, 15.0, 8.0, 11.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.14990997314453, -27.194936752319336, -26.239961624145508, -25.284988403320312, -24.330015182495117, -23.375041961669922, -22.420066833496094, -21.4650936126709, -20.510120391845703, -19.555147171020508, -18.60017204284668, -17.645198822021484, -16.69022560119629, -15.735251426696777, -14.780277252197266, -13.82530403137207, -12.870329856872559, -11.915355682373047, -10.960382461547852, -10.00540828704834, -9.050435066223145, -8.095460891723633, -7.140487194061279, -6.185513496398926, -5.230539798736572, -4.275566101074219, -3.3205924034118652, -2.3656184673309326, -1.410644769668579, -0.4556708335876465, 0.49930286407470703, 1.4542765617370605, 2.409250259399414, 3.3642239570617676, 4.319197654724121, 5.274171829223633, 6.229145050048828, 7.18411922454834, 8.139093399047852, 9.094066619873047, 10.049039840698242, 11.004014015197754, 11.95898723602295, 12.913961410522461, 13.868934631347656, 14.823908805847168, 15.77888298034668, 16.733856201171875, 17.688831329345703, 18.6438045501709, 19.598779678344727, 20.553752899169922, 21.508726119995117, 22.463699340820312, 23.41867446899414, 24.373647689819336, 25.32862091064453, 26.283594131469727, 27.238569259643555, 28.19354248046875, 29.148515701293945, 30.10348892211914, 31.05846405029297, 32.01343536376953, 32.96841049194336]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 3.0, 18.0, 8.0, 10.0, 17.0, 30.0, 31.0, 42.0, 41.0, 60.0, 89.0, 109.0, 182.0, 244.0, 316.0, 495.0, 735.0, 1209.0, 1933.0, 3269.0, 6173.0, 1017118.0, 8065.0, 3942.0, 2265.0, 1414.0, 877.0, 560.0, 363.0, 233.0, 191.0, 140.0, 90.0, 79.0, 52.0, 59.0, 30.0, 29.0, 21.0, 10.0, 17.0, 8.0, 9.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-386.8968811035156, -374.68023681640625, -362.4635925292969, -350.2469482421875, -338.0303039550781, -325.81365966796875, -313.59698486328125, -301.38037109375, -289.1636962890625, -276.9470520019531, -264.73040771484375, -252.51376342773438, -240.297119140625, -228.08047485351562, -215.8638153076172, -203.6471710205078, -191.4305419921875, -179.21389770507812, -166.99725341796875, -154.78060913085938, -142.56396484375, -130.34732055664062, -118.13066101074219, -105.91401672363281, -93.69737243652344, -81.48072814941406, -69.26408386230469, -57.04743194580078, -44.830787658691406, -32.61414337158203, -20.397491455078125, -8.18084716796875, 4.0357666015625, 16.252412796020508, 28.469058990478516, 40.685707092285156, 52.90235137939453, 65.1189956665039, 77.33564758300781, 89.55229187011719, 101.76893615722656, 113.98558044433594, 126.20222473144531, 138.41888427734375, 150.63552856445312, 162.8521728515625, 175.06881713867188, 187.28546142578125, 199.50210571289062, 211.71875, 223.93539428710938, 236.15203857421875, 248.36868286132812, 260.5853271484375, 272.802001953125, 285.01861572265625, 297.23529052734375, 309.4519348144531, 321.6685791015625, 333.8852233886719, 346.10186767578125, 358.3185119628906, 370.53515625, 382.7518310546875, 394.96844482421875]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 17.0, 19.0, 30.0, 35.0, 42.0, 83.0, 112.0, 164.0, 202.0, 300.0, 380.0, 493.0, 624.0, 850.0, 1029.0, 1300.0, 1680.0, 2176.0, 2896.0, 4299.0, 7145.0, 16449.0, 224087.0, 51163432.0, 18634.0, 7597.0, 4552.0, 3058.0, 2189.0, 1699.0, 1341.0, 1069.0, 871.0, 609.0, 495.0, 387.0, 268.0, 237.0, 171.0, 93.0, 95.0, 70.0, 43.0, 30.0, 25.0, 12.0, 9.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-537.3463134765625, -521.5675048828125, -505.78863525390625, -490.0097961425781, -474.23095703125, -458.4521179199219, -442.67327880859375, -426.89447021484375, -411.1156005859375, -395.3367614746094, -379.55792236328125, -363.7790832519531, -348.000244140625, -332.2214050292969, -316.44256591796875, -300.66375732421875, -284.8849182128906, -269.1060791015625, -253.32723999023438, -237.54840087890625, -221.76956176757812, -205.99072265625, -190.21189880371094, -174.4330596923828, -158.6542205810547, -142.87538146972656, -127.09654235839844, -111.31771087646484, -95.53887176513672, -79.7600326538086, -63.981201171875, -48.202362060546875, -32.423492431640625, -16.644655227661133, -0.8658180236816406, 14.913017272949219, 30.691856384277344, 46.47069549560547, 62.24952697753906, 78.02836608886719, 93.80720520019531, 109.58604431152344, 125.36488342285156, 141.14370727539062, 156.92254638671875, 172.70138549804688, 188.480224609375, 204.25906372070312, 220.03790283203125, 235.81674194335938, 251.5955810546875, 267.3744201660156, 283.15325927734375, 298.9320983886719, 314.7109375, 330.48974609375, 346.26861572265625, 362.0474548339844, 377.8262939453125, 393.6051330566406, 409.38397216796875, 425.1628112792969, 440.941650390625, 456.720458984375, 472.4992980957031]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 11.0, 16.0, 24.0, 51.0, 48.0, 77.0, 122.0, 198.0, 294.0, 476.0, 760.0, 1215.0, 1902.0, 3002.0, 4863.0, 7764.0, 12456.0, 20614.0, 34024.0, 58659.0, 102562.0, 184849.0, 354541.0, 749986.0, 1615059.0, 1610177.0, 743795.0, 351989.0, 184271.0, 101824.0, 58280.0, 34259.0, 20373.0, 12402.0, 7658.0, 4692.0, 2864.0, 1939.0, 1216.0, 767.0, 459.0, 324.0, 179.0, 151.0, 99.0, 54.0, 41.0, 22.0, 16.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.34375, -59.22802734375, -57.1123046875, -54.99658203125, -52.880859375, -50.76513671875, -48.6494140625, -46.53369140625, -44.41796875, -42.30224609375, -40.1865234375, -38.07080078125, -35.955078125, -33.83935546875, -31.7236328125, -29.60791015625, -27.4921875, -25.37646484375, -23.2607421875, -21.14501953125, -19.029296875, -16.91357421875, -14.7978515625, -12.68212890625, -10.56640625, -8.45068359375, -6.3349609375, -4.21923828125, -2.103515625, 0.01220703125, 2.1279296875, 4.24365234375, 6.359375, 8.47509765625, 10.5908203125, 12.70654296875, 14.822265625, 16.93798828125, 19.0537109375, 21.16943359375, 23.28515625, 25.40087890625, 27.5166015625, 29.63232421875, 31.748046875, 33.86376953125, 35.9794921875, 38.09521484375, 40.2109375, 42.32666015625, 44.4423828125, 46.55810546875, 48.673828125, 50.78955078125, 52.9052734375, 55.02099609375, 57.13671875, 59.25244140625, 61.3681640625, 63.48388671875, 65.599609375, 67.71533203125, 69.8310546875, 71.94677734375, 74.0625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 14.0, 2.0, 8.0, 13.0, 8.0, 12.0, 19.0, 17.0, 21.0, 33.0, 39.0, 46.0, 56.0, 55.0, 87.0, 103.0, 159.0, 196.0, 191.0, 176.0, 170.0, 139.0, 107.0, 74.0, 54.0, 44.0, 33.0, 25.0, 13.0, 20.0, 23.0, 15.0, 9.0, 4.0, 10.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.0625, -39.7646484375, -38.466796875, -37.1689453125, -35.87109375, -34.5732421875, -33.275390625, -31.9775390625, -30.6796875, -29.3818359375, -28.083984375, -26.7861328125, -25.48828125, -24.1904296875, -22.892578125, -21.5947265625, -20.296875, -18.9990234375, -17.701171875, -16.4033203125, -15.10546875, -13.8076171875, -12.509765625, -11.2119140625, -9.9140625, -8.6162109375, -7.318359375, -6.0205078125, -4.72265625, -3.4248046875, -2.126953125, -0.8291015625, 0.46875, 1.7666015625, 3.064453125, 4.3623046875, 5.66015625, 6.9580078125, 8.255859375, 9.5537109375, 10.8515625, 12.1494140625, 13.447265625, 14.7451171875, 16.04296875, 17.3408203125, 18.638671875, 19.9365234375, 21.234375, 22.5322265625, 23.830078125, 25.1279296875, 26.42578125, 27.7236328125, 29.021484375, 30.3193359375, 31.6171875, 32.9150390625, 34.212890625, 35.5107421875, 36.80859375, 38.1064453125, 39.404296875, 40.7021484375, 42.0]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 8.0, 12.0, 30.0, 54.0, 40.0, 86.0, 138.0, 164.0, 287.0, 403.0, 686.0, 1163.0, 1862.0, 3026.0, 4899.0, 8118.0, 12906.0, 21629.0, 35074.0, 56471.0, 91955.0, 148269.0, 242110.0, 428265.0, 1049957.0, 2172243.0, 988487.0, 413488.0, 233537.0, 144243.0, 88870.0, 55090.0, 34012.0, 20698.0, 12627.0, 7919.0, 4819.0, 2982.0, 1733.0, 1144.0, 719.0, 423.0, 280.0, 184.0, 116.0, 77.0, 47.0, 33.0, 21.0, 13.0, 12.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-36.0625, -34.87890625, -33.6953125, -32.51171875, -31.328125, -30.14453125, -28.9609375, -27.77734375, -26.59375, -25.41015625, -24.2265625, -23.04296875, -21.859375, -20.67578125, -19.4921875, -18.30859375, -17.125, -15.94140625, -14.7578125, -13.57421875, -12.390625, -11.20703125, -10.0234375, -8.83984375, -7.65625, -6.47265625, -5.2890625, -4.10546875, -2.921875, -1.73828125, -0.5546875, 0.62890625, 1.8125, 2.99609375, 4.1796875, 5.36328125, 6.546875, 7.73046875, 8.9140625, 10.09765625, 11.28125, 12.46484375, 13.6484375, 14.83203125, 16.015625, 17.19921875, 18.3828125, 19.56640625, 20.75, 21.93359375, 23.1171875, 24.30078125, 25.484375, 26.66796875, 27.8515625, 29.03515625, 30.21875, 31.40234375, 32.5859375, 33.76953125, 34.953125, 36.13671875, 37.3203125, 38.50390625, 39.6875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 8.0, 6.0, 8.0, 9.0, 9.0, 11.0, 18.0, 21.0, 23.0, 31.0, 47.0, 48.0, 60.0, 77.0, 116.0, 204.0, 326.0, 294.0, 193.0, 130.0, 77.0, 51.0, 49.0, 48.0, 23.0, 24.0, 21.0, 21.0, 11.0, 14.0, 12.0, 6.0, 7.0, 5.0, 0.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.90625, -57.90478515625, -55.9033203125, -53.90185546875, -51.900390625, -49.89892578125, -47.8974609375, -45.89599609375, -43.89453125, -41.89306640625, -39.8916015625, -37.89013671875, -35.888671875, -33.88720703125, -31.8857421875, -29.88427734375, -27.8828125, -25.88134765625, -23.8798828125, -21.87841796875, -19.876953125, -17.87548828125, -15.8740234375, -13.87255859375, -11.87109375, -9.86962890625, -7.8681640625, -5.86669921875, -3.865234375, -1.86376953125, 0.1376953125, 2.13916015625, 4.140625, 6.14208984375, 8.1435546875, 10.14501953125, 12.146484375, 14.14794921875, 16.1494140625, 18.15087890625, 20.15234375, 22.15380859375, 24.1552734375, 26.15673828125, 28.158203125, 30.15966796875, 32.1611328125, 34.16259765625, 36.1640625, 38.16552734375, 40.1669921875, 42.16845703125, 44.169921875, 46.17138671875, 48.1728515625, 50.17431640625, 52.17578125, 54.17724609375, 56.1787109375, 58.18017578125, 60.181640625, 62.18310546875, 64.1845703125, 66.18603515625, 68.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 24.0, 32.0, 38.0, 66.0, 107.0, 135.0, 210.0, 344.0, 573.0, 913.0, 1640.0, 2976.0, 5554.0, 10394.0, 19349.0, 36654.0, 72488.0, 192352.0, 5591775.0, 202148.0, 73578.0, 37120.0, 19425.0, 10387.0, 5606.0, 3107.0, 1770.0, 1030.0, 584.0, 384.0, 249.0, 152.0, 94.0, 56.0, 31.0, 20.0, 17.0, 9.0, 9.0, 3.0, 2.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-108.875, -105.720703125, -102.56640625, -99.412109375, -96.2578125, -93.103515625, -89.94921875, -86.794921875, -83.640625, -80.486328125, -77.33203125, -74.177734375, -71.0234375, -67.869140625, -64.71484375, -61.560546875, -58.40625, -55.251953125, -52.09765625, -48.943359375, -45.7890625, -42.634765625, -39.48046875, -36.326171875, -33.171875, -30.017578125, -26.86328125, -23.708984375, -20.5546875, -17.400390625, -14.24609375, -11.091796875, -7.9375, -4.783203125, -1.62890625, 1.525390625, 4.6796875, 7.833984375, 10.98828125, 14.142578125, 17.296875, 20.451171875, 23.60546875, 26.759765625, 29.9140625, 33.068359375, 36.22265625, 39.376953125, 42.53125, 45.685546875, 48.83984375, 51.994140625, 55.1484375, 58.302734375, 61.45703125, 64.611328125, 67.765625, 70.919921875, 74.07421875, 77.228515625, 80.3828125, 83.537109375, 86.69140625, 89.845703125, 93.0]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 4.0, 8.0, 11.0, 11.0, 12.0, 10.0, 11.0, 15.0, 20.0, 28.0, 30.0, 35.0, 28.0, 46.0, 41.0, 46.0, 73.0, 166.0, 296.0, 330.0, 242.0, 114.0, 63.0, 58.0, 43.0, 39.0, 28.0, 33.0, 22.0, 23.0, 35.0, 17.0, 15.0, 11.0, 13.0, 8.0, 11.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.3125, -80.5615234375, -77.810546875, -75.0595703125, -72.30859375, -69.5576171875, -66.806640625, -64.0556640625, -61.3046875, -58.5537109375, -55.802734375, -53.0517578125, -50.30078125, -47.5498046875, -44.798828125, -42.0478515625, -39.296875, -36.5458984375, -33.794921875, -31.0439453125, -28.29296875, -25.5419921875, -22.791015625, -20.0400390625, -17.2890625, -14.5380859375, -11.787109375, -9.0361328125, -6.28515625, -3.5341796875, -0.783203125, 1.9677734375, 4.71875, 7.4697265625, 10.220703125, 12.9716796875, 15.72265625, 18.4736328125, 21.224609375, 23.9755859375, 26.7265625, 29.4775390625, 32.228515625, 34.9794921875, 37.73046875, 40.4814453125, 43.232421875, 45.9833984375, 48.734375, 51.4853515625, 54.236328125, 56.9873046875, 59.73828125, 62.4892578125, 65.240234375, 67.9912109375, 70.7421875, 73.4931640625, 76.244140625, 78.9951171875, 81.74609375, 84.4970703125, 87.248046875, 89.9990234375, 92.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 10.0, 18.0, 30.0, 43.0, 49.0, 61.0, 91.0, 135.0, 176.0, 113.0, 61.0, 51.0, 30.0, 29.0, 28.0, 13.0, 8.0, 11.0, 10.0, 3.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2196.351318359375, -2126.36474609375, -2056.3779296875, -1986.391357421875, -1916.4046630859375, -1846.41796875, -1776.431396484375, -1706.4447021484375, -1636.4580078125, -1566.4713134765625, -1496.4847412109375, -1426.498046875, -1356.5113525390625, -1286.524658203125, -1216.5380859375, -1146.5513916015625, -1076.5648193359375, -1006.5781860351562, -936.5914916992188, -866.6048583984375, -796.6181640625, -726.6315307617188, -656.6448974609375, -586.658203125, -516.6715698242188, -446.6849060058594, -376.6982421875, -306.71160888671875, -236.72494506835938, -166.73828125, -96.75164794921875, -26.764984130859375, 43.2216796875, 113.20833587646484, 183.1949920654297, 253.181640625, 323.1683044433594, 393.15496826171875, 463.1416015625, 533.1282958984375, 603.1149291992188, 673.1015625, 743.0882568359375, 813.0748901367188, 883.0615234375, 953.0482177734375, 1023.0348510742188, 1093.021484375, 1163.0081787109375, 1232.994873046875, 1302.9814453125, 1372.9681396484375, 1442.954833984375, 1512.94140625, 1582.9281005859375, 1652.914794921875, 1722.9013671875, 1792.8880615234375, 1862.8746337890625, 1932.861328125, 2002.8480224609375, 2072.834716796875, 2142.8212890625, 2212.807861328125, 2282.794677734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 7.0, 5.0, 12.0, 14.0, 11.0, 14.0, 26.0, 23.0, 28.0, 32.0, 32.0, 42.0, 62.0, 99.0, 128.0, 97.0, 66.0, 56.0, 43.0, 37.0, 15.0, 22.0, 28.0, 21.0, 16.0, 14.0, 10.0, 15.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2089.05224609375, -2023.41552734375, -1957.7786865234375, -1892.1419677734375, -1826.505126953125, -1760.868408203125, -1695.231689453125, -1629.594970703125, -1563.9581298828125, -1498.3214111328125, -1432.6845703125, -1367.0478515625, -1301.4111328125, -1235.7742919921875, -1170.1375732421875, -1104.500732421875, -1038.864013671875, -973.2272338867188, -907.5904541015625, -841.9537353515625, -776.3169555664062, -710.68017578125, -645.04345703125, -579.4066772460938, -513.7698974609375, -448.13311767578125, -382.4963684082031, -316.859619140625, -251.22283935546875, -185.5860595703125, -119.94931030273438, -54.31256103515625, 11.32421875, 76.96098327636719, 142.59774780273438, 208.23451232910156, 273.87127685546875, 339.508056640625, 405.1448059082031, 470.78155517578125, 536.4183349609375, 602.0551147460938, 667.69189453125, 733.32861328125, 798.9653930664062, 864.6021728515625, 930.2388916015625, 995.8756713867188, 1061.512451171875, 1127.149169921875, 1192.7860107421875, 1258.4227294921875, 1324.0595703125, 1389.6962890625, 1455.3330078125, 1520.9697265625, 1586.6065673828125, 1652.2432861328125, 1717.880126953125, 1783.516845703125, 1849.153564453125, 1914.7904052734375, 1980.4271240234375, 2046.06396484375, 2111.70068359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 11.0, 14.0, 22.0, 32.0, 39.0, 43.0, 97.0, 137.0, 230.0, 360.0, 577.0, 984.0, 1763.0, 2949.0, 5569.0, 10788.0, 23874.0, 70588.0, 398752.0, 3289919.0, 285226.0, 57991.0, 21490.0, 10036.0, 5295.0, 2892.0, 1732.0, 1007.0, 656.0, 376.0, 247.0, 181.0, 130.0, 83.0, 70.0, 38.0, 21.0, 15.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.1119384765625, -11.700439453125, -11.2889404296875, -10.87744140625, -10.4659423828125, -10.054443359375, -9.6429443359375, -9.2314453125, -8.8199462890625, -8.408447265625, -7.9969482421875, -7.58544921875, -7.1739501953125, -6.762451171875, -6.3509521484375, -5.939453125, -5.5279541015625, -5.116455078125, -4.7049560546875, -4.29345703125, -3.8819580078125, -3.470458984375, -3.0589599609375, -2.6474609375, -2.2359619140625, -1.824462890625, -1.4129638671875, -1.00146484375, -0.5899658203125, -0.178466796875, 0.2330322265625, 0.64453125, 1.0560302734375, 1.467529296875, 1.8790283203125, 2.29052734375, 2.7020263671875, 3.113525390625, 3.5250244140625, 3.9365234375, 4.3480224609375, 4.759521484375, 5.1710205078125, 5.58251953125, 5.9940185546875, 6.405517578125, 6.8170166015625, 7.228515625, 7.6400146484375, 8.051513671875, 8.4630126953125, 8.87451171875, 9.2860107421875, 9.697509765625, 10.1090087890625, 10.5205078125, 10.9320068359375, 11.343505859375, 11.7550048828125, 12.16650390625, 12.5780029296875, 12.989501953125, 13.4010009765625, 13.8125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 2.0, 9.0, 7.0, 8.0, 9.0, 15.0, 28.0, 50.0, 66.0, 98.0, 140.0, 169.0, 113.0, 83.0, 67.0, 37.0, 24.0, 8.0, 14.0, 6.0, 2.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.15802001953125, -2.0914306640625, -2.02484130859375, -1.958251953125, -1.89166259765625, -1.8250732421875, -1.75848388671875, -1.69189453125, -1.62530517578125, -1.5587158203125, -1.49212646484375, -1.425537109375, -1.35894775390625, -1.2923583984375, -1.22576904296875, -1.1591796875, -1.09259033203125, -1.0260009765625, -0.95941162109375, -0.892822265625, -0.82623291015625, -0.7596435546875, -0.69305419921875, -0.62646484375, -0.55987548828125, -0.4932861328125, -0.42669677734375, -0.360107421875, -0.29351806640625, -0.2269287109375, -0.16033935546875, -0.09375, -0.02716064453125, 0.0394287109375, 0.10601806640625, 0.172607421875, 0.23919677734375, 0.3057861328125, 0.37237548828125, 0.43896484375, 0.50555419921875, 0.5721435546875, 0.63873291015625, 0.705322265625, 0.77191162109375, 0.8385009765625, 0.90509033203125, 0.9716796875, 1.03826904296875, 1.1048583984375, 1.17144775390625, 1.238037109375, 1.30462646484375, 1.3712158203125, 1.43780517578125, 1.50439453125, 1.57098388671875, 1.6375732421875, 1.70416259765625, 1.770751953125, 1.83734130859375, 1.9039306640625, 1.97052001953125, 2.037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 19.0, 11.0, 26.0, 35.0, 57.0, 96.0, 155.0, 208.0, 376.0, 653.0, 1028.0, 1993.0, 3505.0, 6813.0, 14246.0, 31626.0, 76637.0, 211754.0, 710720.0, 2104556.0, 688145.0, 206752.0, 75385.0, 30773.0, 13784.0, 6713.0, 3499.0, 1950.0, 1052.0, 620.0, 347.0, 253.0, 157.0, 93.0, 66.0, 42.0, 37.0, 29.0, 17.0, 11.0, 12.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.046875, -8.7501220703125, -8.453369140625, -8.1566162109375, -7.85986328125, -7.5631103515625, -7.266357421875, -6.9696044921875, -6.6728515625, -6.3760986328125, -6.079345703125, -5.7825927734375, -5.48583984375, -5.1890869140625, -4.892333984375, -4.5955810546875, -4.298828125, -4.0020751953125, -3.705322265625, -3.4085693359375, -3.11181640625, -2.8150634765625, -2.518310546875, -2.2215576171875, -1.9248046875, -1.6280517578125, -1.331298828125, -1.0345458984375, -0.73779296875, -0.4410400390625, -0.144287109375, 0.1524658203125, 0.44921875, 0.7459716796875, 1.042724609375, 1.3394775390625, 1.63623046875, 1.9329833984375, 2.229736328125, 2.5264892578125, 2.8232421875, 3.1199951171875, 3.416748046875, 3.7135009765625, 4.01025390625, 4.3070068359375, 4.603759765625, 4.9005126953125, 5.197265625, 5.4940185546875, 5.790771484375, 6.0875244140625, 6.38427734375, 6.6810302734375, 6.977783203125, 7.2745361328125, 7.5712890625, 7.8680419921875, 8.164794921875, 8.4615478515625, 8.75830078125, 9.0550537109375, 9.351806640625, 9.6485595703125, 9.9453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 7.0, 7.0, 13.0, 15.0, 22.0, 35.0, 31.0, 52.0, 60.0, 88.0, 105.0, 151.0, 213.0, 324.0, 459.0, 764.0, 524.0, 332.0, 230.0, 154.0, 135.0, 89.0, 67.0, 49.0, 28.0, 25.0, 24.0, 21.0, 12.0, 12.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.69287109375, -3.5537109375, -3.41455078125, -3.275390625, -3.13623046875, -2.9970703125, -2.85791015625, -2.71875, -2.57958984375, -2.4404296875, -2.30126953125, -2.162109375, -2.02294921875, -1.8837890625, -1.74462890625, -1.60546875, -1.46630859375, -1.3271484375, -1.18798828125, -1.048828125, -0.90966796875, -0.7705078125, -0.63134765625, -0.4921875, -0.35302734375, -0.2138671875, -0.07470703125, 0.064453125, 0.20361328125, 0.3427734375, 0.48193359375, 0.62109375, 0.76025390625, 0.8994140625, 1.03857421875, 1.177734375, 1.31689453125, 1.4560546875, 1.59521484375, 1.734375, 1.87353515625, 2.0126953125, 2.15185546875, 2.291015625, 2.43017578125, 2.5693359375, 2.70849609375, 2.84765625, 2.98681640625, 3.1259765625, 3.26513671875, 3.404296875, 3.54345703125, 3.6826171875, 3.82177734375, 3.9609375, 4.10009765625, 4.2392578125, 4.37841796875, 4.517578125, 4.65673828125, 4.7958984375, 4.93505859375, 5.07421875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 11.0, 21.0, 33.0, 37.0, 79.0, 98.0, 135.0, 133.0, 149.0, 88.0, 78.0, 50.0, 27.0, 25.0, 5.0, 11.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.77008056640625, -48.440250396728516, -47.11042022705078, -45.78059387207031, -44.45076370239258, -43.120933532714844, -41.79110336303711, -40.461273193359375, -39.131446838378906, -37.80161666870117, -36.47178649902344, -35.14196014404297, -33.812129974365234, -32.4822998046875, -31.152469635009766, -29.82263946533203, -28.492809295654297, -27.162979125976562, -25.83315086364746, -24.503320693969727, -23.173492431640625, -21.84366226196289, -20.513832092285156, -19.184001922607422, -17.85417366027832, -16.524343490600586, -15.194515228271484, -13.86468505859375, -12.534855842590332, -11.205026626586914, -9.87519645690918, -8.545367240905762, -7.215541839599609, -5.885712623596191, -4.555882930755615, -3.226053476333618, -1.896224021911621, -0.5663948059082031, 0.763434886932373, 2.093264579772949, 3.423093795776367, 4.752923011779785, 6.082752704620361, 7.4125823974609375, 8.742411613464355, 10.072240829467773, 11.402070999145508, 12.731900215148926, 14.061729431152344, 15.391558647155762, 16.72138786315918, 18.051218032836914, 19.381046295166016, 20.71087646484375, 22.040706634521484, 23.37053680419922, 24.70036506652832, 26.030195236206055, 27.360023498535156, 28.68985366821289, 30.019683837890625, 31.349512100219727, 32.67934036254883, 34.00917053222656, 35.3390007019043]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 6.0, 8.0, 15.0, 16.0, 5.0, 12.0, 26.0, 27.0, 28.0, 42.0, 37.0, 40.0, 51.0, 52.0, 52.0, 53.0, 37.0, 42.0, 41.0, 53.0, 43.0, 31.0, 40.0, 28.0, 36.0, 25.0, 28.0, 20.0, 21.0, 17.0, 14.0, 8.0, 15.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.163835525512695, -23.426963806152344, -22.690092086791992, -21.95322036743164, -21.216346740722656, -20.479475021362305, -19.742603302001953, -19.0057315826416, -18.26885986328125, -17.5319881439209, -16.795116424560547, -16.058242797851562, -15.321371078491211, -14.58449935913086, -13.847627639770508, -13.110755920410156, -12.373882293701172, -11.63701057434082, -10.900137901306152, -10.1632661819458, -9.426393508911133, -8.689521789550781, -7.95265007019043, -7.21577787399292, -6.47890567779541, -5.7420334815979, -5.005161285400391, -4.268289566040039, -3.5314173698425293, -2.7945451736450195, -2.057673454284668, -1.3208012580871582, -0.5839309692382812, 0.15294110774993896, 0.8898131847381592, 1.6266851425170898, 2.3635573387145996, 3.1004295349121094, 3.837301254272461, 4.574173450469971, 5.3110456466674805, 6.04791784286499, 6.7847900390625, 7.521661758422852, 8.258533477783203, 8.995406150817871, 9.732277870178223, 10.46915054321289, 11.206022262573242, 11.942893981933594, 12.679766654968262, 13.416638374328613, 14.153511047363281, 14.890382766723633, 15.627254486083984, 16.364126205444336, 17.100997924804688, 17.83786964416504, 18.57474136352539, 19.311614990234375, 20.048486709594727, 20.785358428955078, 21.52223014831543, 22.25910186767578, 22.995975494384766]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 7.0, 12.0, 20.0, 18.0, 36.0, 50.0, 78.0, 116.0, 191.0, 234.0, 361.0, 570.0, 798.0, 1306.0, 2039.0, 3274.0, 5732.0, 11406.0, 25847.0, 73771.0, 295413.0, 444674.0, 113605.0, 35939.0, 14796.0, 7288.0, 4052.0, 2450.0, 1498.0, 968.0, 661.0, 415.0, 297.0, 195.0, 145.0, 104.0, 66.0, 33.0, 31.0, 12.0, 17.0, 14.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.375, -5.21771240234375, -5.0604248046875, -4.90313720703125, -4.745849609375, -4.58856201171875, -4.4312744140625, -4.27398681640625, -4.11669921875, -3.95941162109375, -3.8021240234375, -3.64483642578125, -3.487548828125, -3.33026123046875, -3.1729736328125, -3.01568603515625, -2.8583984375, -2.70111083984375, -2.5438232421875, -2.38653564453125, -2.229248046875, -2.07196044921875, -1.9146728515625, -1.75738525390625, -1.60009765625, -1.44281005859375, -1.2855224609375, -1.12823486328125, -0.970947265625, -0.81365966796875, -0.6563720703125, -0.49908447265625, -0.341796875, -0.18450927734375, -0.0272216796875, 0.13006591796875, 0.287353515625, 0.44464111328125, 0.6019287109375, 0.75921630859375, 0.91650390625, 1.07379150390625, 1.2310791015625, 1.38836669921875, 1.545654296875, 1.70294189453125, 1.8602294921875, 2.01751708984375, 2.1748046875, 2.33209228515625, 2.4893798828125, 2.64666748046875, 2.803955078125, 2.96124267578125, 3.1185302734375, 3.27581787109375, 3.43310546875, 3.59039306640625, 3.7476806640625, 3.90496826171875, 4.062255859375, 4.21954345703125, 4.3768310546875, 4.53411865234375, 4.69140625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 6.0, 7.0, 8.0, 7.0, 24.0, 27.0, 43.0, 53.0, 67.0, 102.0, 116.0, 96.0, 108.0, 86.0, 60.0, 49.0, 33.0, 19.0, 20.0, 10.0, 10.0, 7.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 0.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017578125, -1.95147705078125, -1.8853759765625, -1.81927490234375, -1.753173828125, -1.68707275390625, -1.6209716796875, -1.55487060546875, -1.48876953125, -1.42266845703125, -1.3565673828125, -1.29046630859375, -1.224365234375, -1.15826416015625, -1.0921630859375, -1.02606201171875, -0.9599609375, -0.89385986328125, -0.8277587890625, -0.76165771484375, -0.695556640625, -0.62945556640625, -0.5633544921875, -0.49725341796875, -0.43115234375, -0.36505126953125, -0.2989501953125, -0.23284912109375, -0.166748046875, -0.10064697265625, -0.0345458984375, 0.03155517578125, 0.09765625, 0.16375732421875, 0.2298583984375, 0.29595947265625, 0.362060546875, 0.42816162109375, 0.4942626953125, 0.56036376953125, 0.62646484375, 0.69256591796875, 0.7586669921875, 0.82476806640625, 0.890869140625, 0.95697021484375, 1.0230712890625, 1.08917236328125, 1.1552734375, 1.22137451171875, 1.2874755859375, 1.35357666015625, 1.419677734375, 1.48577880859375, 1.5518798828125, 1.61798095703125, 1.68408203125, 1.75018310546875, 1.8162841796875, 1.88238525390625, 1.948486328125, 2.01458740234375, 2.0806884765625, 2.14678955078125, 2.212890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 7.0, 17.0, 23.0, 38.0, 43.0, 75.0, 146.0, 225.0, 444.0, 810.0, 1809.0, 4006.0, 9711.0, 25965.0, 85299.0, 351550.0, 418175.0, 100910.0, 30342.0, 10612.0, 4368.0, 1927.0, 985.0, 475.0, 244.0, 115.0, 82.0, 53.0, 23.0, 25.0, 10.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.875, -8.6065673828125, -8.338134765625, -8.0697021484375, -7.80126953125, -7.5328369140625, -7.264404296875, -6.9959716796875, -6.7275390625, -6.4591064453125, -6.190673828125, -5.9222412109375, -5.65380859375, -5.3853759765625, -5.116943359375, -4.8485107421875, -4.580078125, -4.3116455078125, -4.043212890625, -3.7747802734375, -3.50634765625, -3.2379150390625, -2.969482421875, -2.7010498046875, -2.4326171875, -2.1641845703125, -1.895751953125, -1.6273193359375, -1.35888671875, -1.0904541015625, -0.822021484375, -0.5535888671875, -0.28515625, -0.0167236328125, 0.251708984375, 0.5201416015625, 0.78857421875, 1.0570068359375, 1.325439453125, 1.5938720703125, 1.8623046875, 2.1307373046875, 2.399169921875, 2.6676025390625, 2.93603515625, 3.2044677734375, 3.472900390625, 3.7413330078125, 4.009765625, 4.2781982421875, 4.546630859375, 4.8150634765625, 5.08349609375, 5.3519287109375, 5.620361328125, 5.8887939453125, 6.1572265625, 6.4256591796875, 6.694091796875, 6.9625244140625, 7.23095703125, 7.4993896484375, 7.767822265625, 8.0362548828125, 8.3046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 6.0, 7.0, 5.0, 12.0, 7.0, 16.0, 13.0, 19.0, 20.0, 19.0, 22.0, 40.0, 31.0, 26.0, 40.0, 33.0, 37.0, 42.0, 30.0, 39.0, 48.0, 39.0, 50.0, 39.0, 35.0, 31.0, 41.0, 31.0, 30.0, 28.0, 25.0, 29.0, 18.0, 11.0, 8.0, 15.0, 15.0, 9.0, 4.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.25390625, -7.01971435546875, -6.7855224609375, -6.55133056640625, -6.317138671875, -6.08294677734375, -5.8487548828125, -5.61456298828125, -5.38037109375, -5.14617919921875, -4.9119873046875, -4.67779541015625, -4.443603515625, -4.20941162109375, -3.9752197265625, -3.74102783203125, -3.5068359375, -3.27264404296875, -3.0384521484375, -2.80426025390625, -2.570068359375, -2.33587646484375, -2.1016845703125, -1.86749267578125, -1.63330078125, -1.39910888671875, -1.1649169921875, -0.93072509765625, -0.696533203125, -0.46234130859375, -0.2281494140625, 0.00604248046875, 0.240234375, 0.47442626953125, 0.7086181640625, 0.94281005859375, 1.177001953125, 1.41119384765625, 1.6453857421875, 1.87957763671875, 2.11376953125, 2.34796142578125, 2.5821533203125, 2.81634521484375, 3.050537109375, 3.28472900390625, 3.5189208984375, 3.75311279296875, 3.9873046875, 4.22149658203125, 4.4556884765625, 4.68988037109375, 4.924072265625, 5.15826416015625, 5.3924560546875, 5.62664794921875, 5.86083984375, 6.09503173828125, 6.3292236328125, 6.56341552734375, 6.797607421875, 7.03179931640625, 7.2659912109375, 7.50018310546875, 7.734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 12.0, 16.0, 17.0, 24.0, 41.0, 63.0, 128.0, 197.0, 400.0, 1002.0, 2643.0, 9029.0, 44812.0, 429286.0, 494047.0, 51843.0, 10021.0, 2913.0, 1008.0, 449.0, 269.0, 126.0, 77.0, 43.0, 24.0, 28.0, 12.0, 10.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.79931640625, -5.5361328125, -5.27294921875, -5.009765625, -4.74658203125, -4.4833984375, -4.22021484375, -3.95703125, -3.69384765625, -3.4306640625, -3.16748046875, -2.904296875, -2.64111328125, -2.3779296875, -2.11474609375, -1.8515625, -1.58837890625, -1.3251953125, -1.06201171875, -0.798828125, -0.53564453125, -0.2724609375, -0.00927734375, 0.25390625, 0.51708984375, 0.7802734375, 1.04345703125, 1.306640625, 1.56982421875, 1.8330078125, 2.09619140625, 2.359375, 2.62255859375, 2.8857421875, 3.14892578125, 3.412109375, 3.67529296875, 3.9384765625, 4.20166015625, 4.46484375, 4.72802734375, 4.9912109375, 5.25439453125, 5.517578125, 5.78076171875, 6.0439453125, 6.30712890625, 6.5703125, 6.83349609375, 7.0966796875, 7.35986328125, 7.623046875, 7.88623046875, 8.1494140625, 8.41259765625, 8.67578125, 8.93896484375, 9.2021484375, 9.46533203125, 9.728515625, 9.99169921875, 10.2548828125, 10.51806640625, 10.78125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 6.0, 9.0, 5.0, 9.0, 22.0, 18.0, 24.0, 35.0, 38.0, 51.0, 65.0, 69.0, 93.0, 103.0, 96.0, 68.0, 42.0, 70.0, 42.0, 35.0, 21.0, 22.0, 19.0, 17.0, 10.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00034427642822265625, -0.00033511221408843994, -0.00032594799995422363, -0.0003167837858200073, -0.000307619571685791, -0.0002984553575515747, -0.0002892911434173584, -0.0002801269292831421, -0.0002709627151489258, -0.00026179850101470947, -0.00025263428688049316, -0.00024347007274627686, -0.00023430585861206055, -0.00022514164447784424, -0.00021597743034362793, -0.00020681321620941162, -0.0001976490020751953, -0.000188484787940979, -0.0001793205738067627, -0.0001701563596725464, -0.00016099214553833008, -0.00015182793140411377, -0.00014266371726989746, -0.00013349950313568115, -0.00012433528900146484, -0.00011517107486724854, -0.00010600686073303223, -9.684264659881592e-05, -8.767843246459961e-05, -7.85142183303833e-05, -6.935000419616699e-05, -6.0185790061950684e-05, -5.1021575927734375e-05, -4.1857361793518066e-05, -3.269314765930176e-05, -2.352893352508545e-05, -1.436471939086914e-05, -5.200505256652832e-06, 3.9637088775634766e-06, 1.3127923011779785e-05, 2.2292137145996094e-05, 3.14563512802124e-05, 4.062056541442871e-05, 4.978477954864502e-05, 5.894899368286133e-05, 6.811320781707764e-05, 7.727742195129395e-05, 8.644163608551025e-05, 9.560585021972656e-05, 0.00010477006435394287, 0.00011393427848815918, 0.0001230984926223755, 0.0001322627067565918, 0.0001414269208908081, 0.00015059113502502441, 0.00015975534915924072, 0.00016891956329345703, 0.00017808377742767334, 0.00018724799156188965, 0.00019641220569610596, 0.00020557641983032227, 0.00021474063396453857, 0.00022390484809875488, 0.0002330690622329712, 0.0002422332763671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 10.0, 12.0, 25.0, 30.0, 51.0, 79.0, 120.0, 173.0, 316.0, 517.0, 931.0, 1768.0, 3520.0, 7702.0, 18932.0, 56234.0, 205305.0, 463074.0, 200860.0, 55350.0, 18446.0, 7540.0, 3505.0, 1776.0, 924.0, 521.0, 304.0, 206.0, 117.0, 71.0, 37.0, 24.0, 24.0, 10.0, 9.0, 11.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.9609375, -4.80340576171875, -4.6458740234375, -4.48834228515625, -4.330810546875, -4.17327880859375, -4.0157470703125, -3.85821533203125, -3.70068359375, -3.54315185546875, -3.3856201171875, -3.22808837890625, -3.070556640625, -2.91302490234375, -2.7554931640625, -2.59796142578125, -2.4404296875, -2.28289794921875, -2.1253662109375, -1.96783447265625, -1.810302734375, -1.65277099609375, -1.4952392578125, -1.33770751953125, -1.18017578125, -1.02264404296875, -0.8651123046875, -0.70758056640625, -0.550048828125, -0.39251708984375, -0.2349853515625, -0.07745361328125, 0.080078125, 0.23760986328125, 0.3951416015625, 0.55267333984375, 0.710205078125, 0.86773681640625, 1.0252685546875, 1.18280029296875, 1.34033203125, 1.49786376953125, 1.6553955078125, 1.81292724609375, 1.970458984375, 2.12799072265625, 2.2855224609375, 2.44305419921875, 2.6005859375, 2.75811767578125, 2.9156494140625, 3.07318115234375, 3.230712890625, 3.38824462890625, 3.5457763671875, 3.70330810546875, 3.86083984375, 4.01837158203125, 4.1759033203125, 4.33343505859375, 4.490966796875, 4.64849853515625, 4.8060302734375, 4.96356201171875, 5.12109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 7.0, 10.0, 11.0, 12.0, 13.0, 26.0, 20.0, 28.0, 39.0, 45.0, 43.0, 46.0, 74.0, 69.0, 75.0, 63.0, 69.0, 46.0, 48.0, 43.0, 43.0, 37.0, 28.0, 19.0, 20.0, 12.0, 13.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.769989013671875, -2.65911865234375, -2.548248291015625, -2.4373779296875, -2.326507568359375, -2.21563720703125, -2.104766845703125, -1.993896484375, -1.883026123046875, -1.77215576171875, -1.661285400390625, -1.5504150390625, -1.439544677734375, -1.32867431640625, -1.217803955078125, -1.10693359375, -0.996063232421875, -0.88519287109375, -0.774322509765625, -0.6634521484375, -0.552581787109375, -0.44171142578125, -0.330841064453125, -0.219970703125, -0.109100341796875, 0.00177001953125, 0.112640380859375, 0.2235107421875, 0.334381103515625, 0.44525146484375, 0.556121826171875, 0.6669921875, 0.777862548828125, 0.88873291015625, 0.999603271484375, 1.1104736328125, 1.221343994140625, 1.33221435546875, 1.443084716796875, 1.553955078125, 1.664825439453125, 1.77569580078125, 1.886566162109375, 1.9974365234375, 2.108306884765625, 2.21917724609375, 2.330047607421875, 2.44091796875, 2.551788330078125, 2.66265869140625, 2.773529052734375, 2.8843994140625, 2.995269775390625, 3.10614013671875, 3.217010498046875, 3.327880859375, 3.438751220703125, 3.54962158203125, 3.660491943359375, 3.7713623046875, 3.882232666015625, 3.99310302734375, 4.103973388671875, 4.21484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 10.0, 11.0, 10.0, 40.0, 68.0, 218.0, 344.0, 151.0, 81.0, 25.0, 24.0, 6.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.21674346923828, -59.088218688964844, -54.959693908691406, -50.83116912841797, -46.70264434814453, -42.574119567871094, -38.44559860229492, -34.317073822021484, -30.188549041748047, -26.06002426147461, -21.931499481201172, -17.802976608276367, -13.67445182800293, -9.545927047729492, -5.4174041748046875, -1.28887939453125, 2.8396453857421875, 6.968169689178467, 11.096693992614746, 15.225217819213867, 19.353742599487305, 23.482267379760742, 27.610790252685547, 31.739315032958984, 35.86783981323242, 39.99636459350586, 44.1248893737793, 48.25341033935547, 52.381935119628906, 56.510459899902344, 60.63898468017578, 64.76750946044922, 68.89604187011719, 73.02456665039062, 77.15309143066406, 81.2816162109375, 85.41014099121094, 89.53866577148438, 93.66719055175781, 97.79571533203125, 101.92424011230469, 106.05276489257812, 110.18128967285156, 114.309814453125, 118.43833923339844, 122.56686401367188, 126.69538879394531, 130.82391357421875, 134.95242309570312, 139.08094787597656, 143.20947265625, 147.33799743652344, 151.46652221679688, 155.5950469970703, 159.72357177734375, 163.8520965576172, 167.98062133789062, 172.10914611816406, 176.2376708984375, 180.36619567871094, 184.49472045898438, 188.6232452392578, 192.75177001953125, 196.8802947998047, 201.00881958007812]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 1.0, 4.0, 4.0, 8.0, 9.0, 22.0, 27.0, 69.0, 104.0, 154.0, 159.0, 124.0, 121.0, 60.0, 33.0, 22.0, 16.0, 6.0, 5.0, 5.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.57891845703125, -139.5331573486328, -134.4873809814453, -129.44161987304688, -124.3958511352539, -119.35008239746094, -114.3043212890625, -109.25855255126953, -104.21278381347656, -99.1670150756836, -94.12124633789062, -89.07548522949219, -84.02971649169922, -78.98394775390625, -73.93818664550781, -68.89241790771484, -63.846649169921875, -58.800880432128906, -53.7551155090332, -48.7093505859375, -43.66358184814453, -38.61781311035156, -33.57204818725586, -28.526283264160156, -23.480514526367188, -18.43474769592285, -13.388980865478516, -8.34321403503418, -3.2974472045898438, 1.7483196258544922, 6.794086456298828, 11.839851379394531, 16.885635375976562, 21.9314022064209, 26.977169036865234, 32.02293395996094, 37.068702697753906, 42.114471435546875, 47.16023635864258, 52.20600128173828, 57.25177001953125, 62.29753875732422, 67.34330749511719, 72.38906860351562, 77.4348373413086, 82.48060607910156, 87.5263671875, 92.57213592529297, 97.61790466308594, 102.6636734008789, 107.70944213867188, 112.75520324707031, 117.80097198486328, 122.84674072265625, 127.89250183105469, 132.93826293945312, 137.98403930664062, 143.02980041503906, 148.07557678222656, 153.121337890625, 158.1671142578125, 163.21287536621094, 168.25863647460938, 173.30441284179688, 178.3501739501953]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 8.0, 4.0, 5.0, 6.0, 14.0, 13.0, 21.0, 32.0, 50.0, 101.0, 191.0, 351.0, 680.0, 1523.0, 4169.0, 13335.0, 73131.0, 3603114.0, 447629.0, 35587.0, 8536.0, 2987.0, 1292.0, 627.0, 346.0, 215.0, 105.0, 68.0, 48.0, 31.0, 15.0, 12.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.359375, -23.291748046875, -22.22412109375, -21.156494140625, -20.0888671875, -19.021240234375, -17.95361328125, -16.885986328125, -15.818359375, -14.750732421875, -13.68310546875, -12.615478515625, -11.5478515625, -10.480224609375, -9.41259765625, -8.344970703125, -7.27734375, -6.209716796875, -5.14208984375, -4.074462890625, -3.0068359375, -1.939208984375, -0.87158203125, 0.196044921875, 1.263671875, 2.331298828125, 3.39892578125, 4.466552734375, 5.5341796875, 6.601806640625, 7.66943359375, 8.737060546875, 9.8046875, 10.872314453125, 11.93994140625, 13.007568359375, 14.0751953125, 15.142822265625, 16.21044921875, 17.278076171875, 18.345703125, 19.413330078125, 20.48095703125, 21.548583984375, 22.6162109375, 23.683837890625, 24.75146484375, 25.819091796875, 26.88671875, 27.954345703125, 29.02197265625, 30.089599609375, 31.1572265625, 32.224853515625, 33.29248046875, 34.360107421875, 35.427734375, 36.495361328125, 37.56298828125, 38.630615234375, 39.6982421875, 40.765869140625, 41.83349609375, 42.901123046875, 43.96875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 9.0, 6.0, 11.0, 5.0, 15.0, 23.0, 28.0, 39.0, 41.0, 59.0, 74.0, 69.0, 87.0, 92.0, 78.0, 65.0, 58.0, 45.0, 44.0, 30.0, 33.0, 18.0, 20.0, 7.0, 11.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3984375, -1.343658447265625, -1.28887939453125, -1.234100341796875, -1.1793212890625, -1.124542236328125, -1.06976318359375, -1.014984130859375, -0.960205078125, -0.905426025390625, -0.85064697265625, -0.795867919921875, -0.7410888671875, -0.686309814453125, -0.63153076171875, -0.576751708984375, -0.52197265625, -0.467193603515625, -0.41241455078125, -0.357635498046875, -0.3028564453125, -0.248077392578125, -0.19329833984375, -0.138519287109375, -0.083740234375, -0.028961181640625, 0.02581787109375, 0.080596923828125, 0.1353759765625, 0.190155029296875, 0.24493408203125, 0.299713134765625, 0.3544921875, 0.409271240234375, 0.46405029296875, 0.518829345703125, 0.5736083984375, 0.628387451171875, 0.68316650390625, 0.737945556640625, 0.792724609375, 0.847503662109375, 0.90228271484375, 0.957061767578125, 1.0118408203125, 1.066619873046875, 1.12139892578125, 1.176177978515625, 1.23095703125, 1.285736083984375, 1.34051513671875, 1.395294189453125, 1.4500732421875, 1.504852294921875, 1.55963134765625, 1.614410400390625, 1.669189453125, 1.723968505859375, 1.77874755859375, 1.833526611328125, 1.8883056640625, 1.943084716796875, 1.99786376953125, 2.052642822265625, 2.107421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 21.0, 25.0, 41.0, 76.0, 89.0, 182.0, 289.0, 468.0, 877.0, 1750.0, 3766.0, 8902.0, 22183.0, 68441.0, 295146.0, 3023586.0, 603608.0, 109519.0, 32739.0, 12196.0, 5233.0, 2369.0, 1150.0, 637.0, 380.0, 194.0, 127.0, 91.0, 72.0, 32.0, 20.0, 21.0, 7.0, 11.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-17.765625, -17.1865234375, -16.607421875, -16.0283203125, -15.44921875, -14.8701171875, -14.291015625, -13.7119140625, -13.1328125, -12.5537109375, -11.974609375, -11.3955078125, -10.81640625, -10.2373046875, -9.658203125, -9.0791015625, -8.5, -7.9208984375, -7.341796875, -6.7626953125, -6.18359375, -5.6044921875, -5.025390625, -4.4462890625, -3.8671875, -3.2880859375, -2.708984375, -2.1298828125, -1.55078125, -0.9716796875, -0.392578125, 0.1865234375, 0.765625, 1.3447265625, 1.923828125, 2.5029296875, 3.08203125, 3.6611328125, 4.240234375, 4.8193359375, 5.3984375, 5.9775390625, 6.556640625, 7.1357421875, 7.71484375, 8.2939453125, 8.873046875, 9.4521484375, 10.03125, 10.6103515625, 11.189453125, 11.7685546875, 12.34765625, 12.9267578125, 13.505859375, 14.0849609375, 14.6640625, 15.2431640625, 15.822265625, 16.4013671875, 16.98046875, 17.5595703125, 18.138671875, 18.7177734375, 19.296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 12.0, 18.0, 22.0, 18.0, 45.0, 60.0, 89.0, 131.0, 253.0, 445.0, 1492.0, 626.0, 302.0, 158.0, 107.0, 72.0, 65.0, 39.0, 17.0, 18.0, 11.0, 13.0, 8.0, 14.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.4453125, -3.339935302734375, -3.23455810546875, -3.129180908203125, -3.0238037109375, -2.918426513671875, -2.81304931640625, -2.707672119140625, -2.602294921875, -2.496917724609375, -2.39154052734375, -2.286163330078125, -2.1807861328125, -2.075408935546875, -1.97003173828125, -1.864654541015625, -1.75927734375, -1.653900146484375, -1.54852294921875, -1.443145751953125, -1.3377685546875, -1.232391357421875, -1.12701416015625, -1.021636962890625, -0.916259765625, -0.810882568359375, -0.70550537109375, -0.600128173828125, -0.4947509765625, -0.389373779296875, -0.28399658203125, -0.178619384765625, -0.0732421875, 0.032135009765625, 0.13751220703125, 0.242889404296875, 0.3482666015625, 0.453643798828125, 0.55902099609375, 0.664398193359375, 0.769775390625, 0.875152587890625, 0.98052978515625, 1.085906982421875, 1.1912841796875, 1.296661376953125, 1.40203857421875, 1.507415771484375, 1.61279296875, 1.718170166015625, 1.82354736328125, 1.928924560546875, 2.0343017578125, 2.139678955078125, 2.24505615234375, 2.350433349609375, 2.455810546875, 2.561187744140625, 2.66656494140625, 2.771942138671875, 2.8773193359375, 2.982696533203125, 3.08807373046875, 3.193450927734375, 3.298828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 24.0, 33.0, 83.0, 127.0, 197.0, 192.0, 130.0, 87.0, 49.0, 23.0, 13.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.113744735717773, -17.041501998901367, -15.969259262084961, -14.897016525268555, -13.824773788452148, -12.752531051635742, -11.680288314819336, -10.60804557800293, -9.535802841186523, -8.463560104370117, -7.391317367553711, -6.319074630737305, -5.246831893920898, -4.174589157104492, -3.102346420288086, -2.0301036834716797, -0.9578609466552734, 0.11438179016113281, 1.186624526977539, 2.2588672637939453, 3.3311100006103516, 4.403352737426758, 5.475595474243164, 6.54783821105957, 7.620080947875977, 8.692323684692383, 9.764566421508789, 10.836809158325195, 11.909051895141602, 12.981294631958008, 14.053537368774414, 15.12578010559082, 16.19802474975586, 17.270267486572266, 18.342510223388672, 19.414752960205078, 20.486995697021484, 21.55923843383789, 22.631481170654297, 23.703723907470703, 24.77596664428711, 25.848209381103516, 26.920452117919922, 27.992694854736328, 29.064937591552734, 30.13718032836914, 31.209423065185547, 32.28166580200195, 33.35390853881836, 34.426151275634766, 35.49839401245117, 36.57063674926758, 37.642879486083984, 38.71512222290039, 39.7873649597168, 40.8596076965332, 41.93185043334961, 43.004093170166016, 44.07633590698242, 45.14857864379883, 46.220821380615234, 47.29306411743164, 48.36530685424805, 49.43754959106445, 50.50979232788086]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 4.0, 7.0, 14.0, 15.0, 15.0, 22.0, 28.0, 26.0, 48.0, 31.0, 62.0, 62.0, 59.0, 58.0, 62.0, 64.0, 55.0, 67.0, 45.0, 45.0, 42.0, 39.0, 31.0, 20.0, 19.0, 16.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.030752182006836, -21.472139358520508, -20.913524627685547, -20.35491180419922, -19.79629898071289, -19.237686157226562, -18.679073333740234, -18.120458602905273, -17.561845779418945, -17.003232955932617, -16.444618225097656, -15.886005401611328, -15.327392578125, -14.768779754638672, -14.210165977478027, -13.651552200317383, -13.092939376831055, -12.534326553344727, -11.975712776184082, -11.417098999023438, -10.85848617553711, -10.299873352050781, -9.741259574890137, -9.182645797729492, -8.624032974243164, -8.065420150756836, -7.506806373596191, -6.948193073272705, -6.389579772949219, -5.830966472625732, -5.272353172302246, -4.71373987197876, -4.155128479003906, -3.59651517868042, -3.0379018783569336, -2.4792885780334473, -1.920675277709961, -1.3620619773864746, -0.8034486770629883, -0.24483537673950195, 0.3137779235839844, 0.8723912239074707, 1.431004524230957, 1.9896178245544434, 2.5482311248779297, 3.106844425201416, 3.6654577255249023, 4.224071025848389, 4.782684326171875, 5.341297626495361, 5.899910926818848, 6.458524227142334, 7.01713752746582, 7.575750827789307, 8.134364128112793, 8.692977905273438, 9.251590728759766, 9.810203552246094, 10.368817329406738, 10.927431106567383, 11.486043930053711, 12.044656753540039, 12.603270530700684, 13.161884307861328, 13.720497131347656]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 9.0, 6.0, 17.0, 23.0, 20.0, 37.0, 34.0, 84.0, 108.0, 189.0, 283.0, 433.0, 708.0, 1379.0, 2628.0, 5434.0, 13108.0, 37763.0, 133118.0, 430730.0, 300114.0, 80003.0, 24387.0, 9306.0, 4053.0, 1898.0, 1026.0, 626.0, 339.0, 253.0, 139.0, 87.0, 54.0, 38.0, 30.0, 12.0, 16.0, 15.0, 7.0, 9.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1171875, -13.67333984375, -13.2294921875, -12.78564453125, -12.341796875, -11.89794921875, -11.4541015625, -11.01025390625, -10.56640625, -10.12255859375, -9.6787109375, -9.23486328125, -8.791015625, -8.34716796875, -7.9033203125, -7.45947265625, -7.015625, -6.57177734375, -6.1279296875, -5.68408203125, -5.240234375, -4.79638671875, -4.3525390625, -3.90869140625, -3.46484375, -3.02099609375, -2.5771484375, -2.13330078125, -1.689453125, -1.24560546875, -0.8017578125, -0.35791015625, 0.0859375, 0.52978515625, 0.9736328125, 1.41748046875, 1.861328125, 2.30517578125, 2.7490234375, 3.19287109375, 3.63671875, 4.08056640625, 4.5244140625, 4.96826171875, 5.412109375, 5.85595703125, 6.2998046875, 6.74365234375, 7.1875, 7.63134765625, 8.0751953125, 8.51904296875, 8.962890625, 9.40673828125, 9.8505859375, 10.29443359375, 10.73828125, 11.18212890625, 11.6259765625, 12.06982421875, 12.513671875, 12.95751953125, 13.4013671875, 13.84521484375, 14.2890625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 9.0, 13.0, 12.0, 19.0, 22.0, 29.0, 38.0, 51.0, 55.0, 42.0, 62.0, 81.0, 81.0, 68.0, 63.0, 69.0, 48.0, 46.0, 29.0, 26.0, 22.0, 21.0, 14.0, 17.0, 10.0, 10.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.35546875, -1.3050537109375, -1.254638671875, -1.2042236328125, -1.15380859375, -1.1033935546875, -1.052978515625, -1.0025634765625, -0.9521484375, -0.9017333984375, -0.851318359375, -0.8009033203125, -0.75048828125, -0.7000732421875, -0.649658203125, -0.5992431640625, -0.548828125, -0.4984130859375, -0.447998046875, -0.3975830078125, -0.34716796875, -0.2967529296875, -0.246337890625, -0.1959228515625, -0.1455078125, -0.0950927734375, -0.044677734375, 0.0057373046875, 0.05615234375, 0.1065673828125, 0.156982421875, 0.2073974609375, 0.2578125, 0.3082275390625, 0.358642578125, 0.4090576171875, 0.45947265625, 0.5098876953125, 0.560302734375, 0.6107177734375, 0.6611328125, 0.7115478515625, 0.761962890625, 0.8123779296875, 0.86279296875, 0.9132080078125, 0.963623046875, 1.0140380859375, 1.064453125, 1.1148681640625, 1.165283203125, 1.2156982421875, 1.26611328125, 1.3165283203125, 1.366943359375, 1.4173583984375, 1.4677734375, 1.5181884765625, 1.568603515625, 1.6190185546875, 1.66943359375, 1.7198486328125, 1.770263671875, 1.8206787109375, 1.87109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 11.0, 11.0, 27.0, 26.0, 37.0, 70.0, 82.0, 167.0, 270.0, 424.0, 694.0, 1268.0, 2441.0, 5289.0, 14623.0, 59179.0, 357232.0, 488431.0, 86803.0, 19069.0, 6303.0, 2708.0, 1399.0, 787.0, 439.0, 269.0, 172.0, 96.0, 75.0, 42.0, 30.0, 28.0, 11.0, 11.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.8984375, -14.4345703125, -13.970703125, -13.5068359375, -13.04296875, -12.5791015625, -12.115234375, -11.6513671875, -11.1875, -10.7236328125, -10.259765625, -9.7958984375, -9.33203125, -8.8681640625, -8.404296875, -7.9404296875, -7.4765625, -7.0126953125, -6.548828125, -6.0849609375, -5.62109375, -5.1572265625, -4.693359375, -4.2294921875, -3.765625, -3.3017578125, -2.837890625, -2.3740234375, -1.91015625, -1.4462890625, -0.982421875, -0.5185546875, -0.0546875, 0.4091796875, 0.873046875, 1.3369140625, 1.80078125, 2.2646484375, 2.728515625, 3.1923828125, 3.65625, 4.1201171875, 4.583984375, 5.0478515625, 5.51171875, 5.9755859375, 6.439453125, 6.9033203125, 7.3671875, 7.8310546875, 8.294921875, 8.7587890625, 9.22265625, 9.6865234375, 10.150390625, 10.6142578125, 11.078125, 11.5419921875, 12.005859375, 12.4697265625, 12.93359375, 13.3974609375, 13.861328125, 14.3251953125, 14.7890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 7.0, 14.0, 25.0, 26.0, 40.0, 33.0, 48.0, 50.0, 61.0, 72.0, 81.0, 80.0, 73.0, 63.0, 69.0, 52.0, 49.0, 35.0, 25.0, 24.0, 15.0, 17.0, 9.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.421875, -10.1279296875, -9.833984375, -9.5400390625, -9.24609375, -8.9521484375, -8.658203125, -8.3642578125, -8.0703125, -7.7763671875, -7.482421875, -7.1884765625, -6.89453125, -6.6005859375, -6.306640625, -6.0126953125, -5.71875, -5.4248046875, -5.130859375, -4.8369140625, -4.54296875, -4.2490234375, -3.955078125, -3.6611328125, -3.3671875, -3.0732421875, -2.779296875, -2.4853515625, -2.19140625, -1.8974609375, -1.603515625, -1.3095703125, -1.015625, -0.7216796875, -0.427734375, -0.1337890625, 0.16015625, 0.4541015625, 0.748046875, 1.0419921875, 1.3359375, 1.6298828125, 1.923828125, 2.2177734375, 2.51171875, 2.8056640625, 3.099609375, 3.3935546875, 3.6875, 3.9814453125, 4.275390625, 4.5693359375, 4.86328125, 5.1572265625, 5.451171875, 5.7451171875, 6.0390625, 6.3330078125, 6.626953125, 6.9208984375, 7.21484375, 7.5087890625, 7.802734375, 8.0966796875, 8.390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 5.0, 12.0, 12.0, 22.0, 31.0, 41.0, 73.0, 120.0, 223.0, 374.0, 751.0, 1648.0, 4099.0, 12668.0, 56752.0, 379053.0, 488408.0, 79626.0, 15850.0, 5031.0, 1878.0, 862.0, 433.0, 226.0, 123.0, 80.0, 56.0, 34.0, 19.0, 16.0, 11.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.8125, -21.2545166015625, -20.696533203125, -20.1385498046875, -19.58056640625, -19.0225830078125, -18.464599609375, -17.9066162109375, -17.3486328125, -16.7906494140625, -16.232666015625, -15.6746826171875, -15.11669921875, -14.5587158203125, -14.000732421875, -13.4427490234375, -12.884765625, -12.3267822265625, -11.768798828125, -11.2108154296875, -10.65283203125, -10.0948486328125, -9.536865234375, -8.9788818359375, -8.4208984375, -7.8629150390625, -7.304931640625, -6.7469482421875, -6.18896484375, -5.6309814453125, -5.072998046875, -4.5150146484375, -3.95703125, -3.3990478515625, -2.841064453125, -2.2830810546875, -1.72509765625, -1.1671142578125, -0.609130859375, -0.0511474609375, 0.5068359375, 1.0648193359375, 1.622802734375, 2.1807861328125, 2.73876953125, 3.2967529296875, 3.854736328125, 4.4127197265625, 4.970703125, 5.5286865234375, 6.086669921875, 6.6446533203125, 7.20263671875, 7.7606201171875, 8.318603515625, 8.8765869140625, 9.4345703125, 9.9925537109375, 10.550537109375, 11.1085205078125, 11.66650390625, 12.2244873046875, 12.782470703125, 13.3404541015625, 13.8984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 19.0, 37.0, 97.0, 160.0, 247.0, 193.0, 102.0, 51.0, 34.0, 13.0, 5.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019741058349609375, -0.001913607120513916, -0.0018531084060668945, -0.001792609691619873, -0.0017321109771728516, -0.00167161226272583, -0.0016111135482788086, -0.0015506148338317871, -0.0014901161193847656, -0.0014296174049377441, -0.0013691186904907227, -0.0013086199760437012, -0.0012481212615966797, -0.0011876225471496582, -0.0011271238327026367, -0.0010666251182556152, -0.0010061264038085938, -0.0009456276893615723, -0.0008851289749145508, -0.0008246302604675293, -0.0007641315460205078, -0.0007036328315734863, -0.0006431341171264648, -0.0005826354026794434, -0.0005221366882324219, -0.0004616379737854004, -0.0004011392593383789, -0.0003406405448913574, -0.00028014183044433594, -0.00021964311599731445, -0.00015914440155029297, -9.864568710327148e-05, -3.814697265625e-05, 2.2351741790771484e-05, 8.285045623779297e-05, 0.00014334917068481445, 0.00020384788513183594, 0.0002643465995788574, 0.0003248453140258789, 0.0003853440284729004, 0.0004458427429199219, 0.0005063414573669434, 0.0005668401718139648, 0.0006273388862609863, 0.0006878376007080078, 0.0007483363151550293, 0.0008088350296020508, 0.0008693337440490723, 0.0009298324584960938, 0.0009903311729431152, 0.0010508298873901367, 0.0011113286018371582, 0.0011718273162841797, 0.0012323260307312012, 0.0012928247451782227, 0.0013533234596252441, 0.0014138221740722656, 0.0014743208885192871, 0.0015348196029663086, 0.00159531831741333, 0.0016558170318603516, 0.001716315746307373, 0.0017768144607543945, 0.001837313175201416, 0.0018978118896484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 11.0, 12.0, 10.0, 15.0, 31.0, 44.0, 63.0, 75.0, 118.0, 190.0, 283.0, 475.0, 739.0, 1407.0, 2636.0, 5370.0, 12703.0, 37418.0, 134261.0, 410093.0, 311611.0, 86561.0, 25625.0, 9563.0, 4189.0, 2120.0, 1129.0, 660.0, 380.0, 225.0, 183.0, 117.0, 65.0, 42.0, 32.0, 23.0, 21.0, 14.0, 11.0, 9.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-12.921875, -12.5283203125, -12.134765625, -11.7412109375, -11.34765625, -10.9541015625, -10.560546875, -10.1669921875, -9.7734375, -9.3798828125, -8.986328125, -8.5927734375, -8.19921875, -7.8056640625, -7.412109375, -7.0185546875, -6.625, -6.2314453125, -5.837890625, -5.4443359375, -5.05078125, -4.6572265625, -4.263671875, -3.8701171875, -3.4765625, -3.0830078125, -2.689453125, -2.2958984375, -1.90234375, -1.5087890625, -1.115234375, -0.7216796875, -0.328125, 0.0654296875, 0.458984375, 0.8525390625, 1.24609375, 1.6396484375, 2.033203125, 2.4267578125, 2.8203125, 3.2138671875, 3.607421875, 4.0009765625, 4.39453125, 4.7880859375, 5.181640625, 5.5751953125, 5.96875, 6.3623046875, 6.755859375, 7.1494140625, 7.54296875, 7.9365234375, 8.330078125, 8.7236328125, 9.1171875, 9.5107421875, 9.904296875, 10.2978515625, 10.69140625, 11.0849609375, 11.478515625, 11.8720703125, 12.265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 9.0, 18.0, 27.0, 37.0, 49.0, 59.0, 78.0, 97.0, 111.0, 117.0, 91.0, 82.0, 54.0, 31.0, 34.0, 24.0, 9.0, 12.0, 10.0, 13.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.7171630859375, -8.434326171875, -8.1514892578125, -7.86865234375, -7.5858154296875, -7.302978515625, -7.0201416015625, -6.7373046875, -6.4544677734375, -6.171630859375, -5.8887939453125, -5.60595703125, -5.3231201171875, -5.040283203125, -4.7574462890625, -4.474609375, -4.1917724609375, -3.908935546875, -3.6260986328125, -3.34326171875, -3.0604248046875, -2.777587890625, -2.4947509765625, -2.2119140625, -1.9290771484375, -1.646240234375, -1.3634033203125, -1.08056640625, -0.7977294921875, -0.514892578125, -0.2320556640625, 0.05078125, 0.3336181640625, 0.616455078125, 0.8992919921875, 1.18212890625, 1.4649658203125, 1.747802734375, 2.0306396484375, 2.3134765625, 2.5963134765625, 2.879150390625, 3.1619873046875, 3.44482421875, 3.7276611328125, 4.010498046875, 4.2933349609375, 4.576171875, 4.8590087890625, 5.141845703125, 5.4246826171875, 5.70751953125, 5.9903564453125, 6.273193359375, 6.5560302734375, 6.8388671875, 7.1217041015625, 7.404541015625, 7.6873779296875, 7.97021484375, 8.2530517578125, 8.535888671875, 8.8187255859375, 9.1015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 10.0, 30.0, 74.0, 147.0, 194.0, 208.0, 174.0, 72.0, 36.0, 15.0, 12.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.61133575439453, -82.18106842041016, -78.75079345703125, -75.32052612304688, -71.8902587890625, -68.45999145507812, -65.02972412109375, -61.599449157714844, -58.16918182373047, -54.738914489746094, -51.30864334106445, -47.87837219238281, -44.44810485839844, -41.01783752441406, -37.58756637573242, -34.15729522705078, -30.727027893066406, -27.2967586517334, -23.86648941040039, -20.436220169067383, -17.005950927734375, -13.575681686401367, -10.14541244506836, -6.715143203735352, -3.2848739624023438, 0.14539527893066406, 3.575664520263672, 7.00593376159668, 10.436203002929688, 13.866472244262695, 17.296741485595703, 20.72701072692871, 24.15728759765625, 27.587556838989258, 31.017826080322266, 34.448097229003906, 37.87836456298828, 41.308631896972656, 44.7389030456543, 48.16917419433594, 51.59944152832031, 55.02970886230469, 58.45998001098633, 61.89025115966797, 65.32051849365234, 68.75078582763672, 72.18106079101562, 75.611328125, 79.04159545898438, 82.47186279296875, 85.90213012695312, 89.33240509033203, 92.7626724243164, 96.19293975830078, 99.62321472167969, 103.05348205566406, 106.48374938964844, 109.91401672363281, 113.34428405761719, 116.7745590209961, 120.20482635498047, 123.63509368896484, 127.06536865234375, 130.49563598632812, 133.9259033203125]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 7.0, 6.0, 5.0, 6.0, 8.0, 9.0, 18.0, 19.0, 20.0, 28.0, 34.0, 43.0, 47.0, 44.0, 54.0, 70.0, 56.0, 57.0, 59.0, 57.0, 44.0, 52.0, 43.0, 39.0, 33.0, 21.0, 30.0, 22.0, 12.0, 11.0, 8.0, 10.0, 12.0, 6.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.20018768310547, -44.69313430786133, -43.18608093261719, -41.67902374267578, -40.17197036743164, -38.6649169921875, -37.15786361694336, -35.65081024169922, -34.14375686645508, -32.63670349121094, -31.129648208618164, -29.622594833374023, -28.115541458129883, -26.60848617553711, -25.10143280029297, -23.594379425048828, -22.087324142456055, -20.580270767211914, -19.07321548461914, -17.566162109375, -16.05910873413086, -14.552054405212402, -13.045000076293945, -11.537946701049805, -10.030892372131348, -8.52383804321289, -7.01678466796875, -5.509730339050293, -4.002676486968994, -2.4956226348876953, -0.9885683059692383, 0.5184850692749023, 2.0255393981933594, 3.532593250274658, 5.039647102355957, 6.546701431274414, 8.053754806518555, 9.560809135437012, 11.067863464355469, 12.57491683959961, 14.081971168518066, 15.589025497436523, 17.096078872680664, 18.603134155273438, 20.110187530517578, 21.61724090576172, 23.12429428100586, 24.63134765625, 26.138402938842773, 27.645456314086914, 29.152511596679688, 30.659564971923828, 32.16661834716797, 33.67367172241211, 35.18072509765625, 36.687782287597656, 38.1948356628418, 39.70188903808594, 41.20894241333008, 42.71599578857422, 44.223052978515625, 45.730106353759766, 47.237159729003906, 48.74421310424805, 50.25126647949219]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 17.0, 21.0, 27.0, 40.0, 75.0, 99.0, 173.0, 302.0, 546.0, 1012.0, 2177.0, 5043.0, 12167.0, 35190.0, 130661.0, 885802.0, 2806235.0, 227628.0, 54281.0, 18162.0, 7349.0, 3368.0, 1721.0, 896.0, 486.0, 282.0, 171.0, 128.0, 74.0, 36.0, 38.0, 20.0, 8.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.203125, -22.3798828125, -21.556640625, -20.7333984375, -19.91015625, -19.0869140625, -18.263671875, -17.4404296875, -16.6171875, -15.7939453125, -14.970703125, -14.1474609375, -13.32421875, -12.5009765625, -11.677734375, -10.8544921875, -10.03125, -9.2080078125, -8.384765625, -7.5615234375, -6.73828125, -5.9150390625, -5.091796875, -4.2685546875, -3.4453125, -2.6220703125, -1.798828125, -0.9755859375, -0.15234375, 0.6708984375, 1.494140625, 2.3173828125, 3.140625, 3.9638671875, 4.787109375, 5.6103515625, 6.43359375, 7.2568359375, 8.080078125, 8.9033203125, 9.7265625, 10.5498046875, 11.373046875, 12.1962890625, 13.01953125, 13.8427734375, 14.666015625, 15.4892578125, 16.3125, 17.1357421875, 17.958984375, 18.7822265625, 19.60546875, 20.4287109375, 21.251953125, 22.0751953125, 22.8984375, 23.7216796875, 24.544921875, 25.3681640625, 26.19140625, 27.0146484375, 27.837890625, 28.6611328125, 29.484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 9.0, 5.0, 7.0, 8.0, 9.0, 14.0, 21.0, 20.0, 42.0, 37.0, 51.0, 51.0, 71.0, 69.0, 76.0, 89.0, 75.0, 57.0, 62.0, 40.0, 48.0, 33.0, 12.0, 18.0, 21.0, 15.0, 14.0, 9.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.61114501953125, -1.5562744140625, -1.50140380859375, -1.446533203125, -1.39166259765625, -1.3367919921875, -1.28192138671875, -1.22705078125, -1.17218017578125, -1.1173095703125, -1.06243896484375, -1.007568359375, -0.95269775390625, -0.8978271484375, -0.84295654296875, -0.7880859375, -0.73321533203125, -0.6783447265625, -0.62347412109375, -0.568603515625, -0.51373291015625, -0.4588623046875, -0.40399169921875, -0.34912109375, -0.29425048828125, -0.2393798828125, -0.18450927734375, -0.129638671875, -0.07476806640625, -0.0198974609375, 0.03497314453125, 0.08984375, 0.14471435546875, 0.1995849609375, 0.25445556640625, 0.309326171875, 0.36419677734375, 0.4190673828125, 0.47393798828125, 0.52880859375, 0.58367919921875, 0.6385498046875, 0.69342041015625, 0.748291015625, 0.80316162109375, 0.8580322265625, 0.91290283203125, 0.9677734375, 1.02264404296875, 1.0775146484375, 1.13238525390625, 1.187255859375, 1.24212646484375, 1.2969970703125, 1.35186767578125, 1.40673828125, 1.46160888671875, 1.5164794921875, 1.57135009765625, 1.626220703125, 1.68109130859375, 1.7359619140625, 1.79083251953125, 1.845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 4.0, 10.0, 12.0, 20.0, 27.0, 61.0, 91.0, 174.0, 370.0, 941.0, 3478.0, 20841.0, 248409.0, 3512226.0, 373727.0, 27587.0, 4328.0, 1068.0, 406.0, 201.0, 116.0, 63.0, 45.0, 21.0, 13.0, 11.0, 11.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.65625, -45.1298828125, -43.603515625, -42.0771484375, -40.55078125, -39.0244140625, -37.498046875, -35.9716796875, -34.4453125, -32.9189453125, -31.392578125, -29.8662109375, -28.33984375, -26.8134765625, -25.287109375, -23.7607421875, -22.234375, -20.7080078125, -19.181640625, -17.6552734375, -16.12890625, -14.6025390625, -13.076171875, -11.5498046875, -10.0234375, -8.4970703125, -6.970703125, -5.4443359375, -3.91796875, -2.3916015625, -0.865234375, 0.6611328125, 2.1875, 3.7138671875, 5.240234375, 6.7666015625, 8.29296875, 9.8193359375, 11.345703125, 12.8720703125, 14.3984375, 15.9248046875, 17.451171875, 18.9775390625, 20.50390625, 22.0302734375, 23.556640625, 25.0830078125, 26.609375, 28.1357421875, 29.662109375, 31.1884765625, 32.71484375, 34.2412109375, 35.767578125, 37.2939453125, 38.8203125, 40.3466796875, 41.873046875, 43.3994140625, 44.92578125, 46.4521484375, 47.978515625, 49.5048828125, 51.03125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 13.0, 14.0, 12.0, 16.0, 28.0, 55.0, 65.0, 87.0, 122.0, 187.0, 304.0, 456.0, 865.0, 671.0, 397.0, 283.0, 159.0, 104.0, 75.0, 53.0, 27.0, 26.0, 16.0, 13.0, 6.0, 9.0, 6.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.796661376953125, -3.64996337890625, -3.503265380859375, -3.3565673828125, -3.209869384765625, -3.06317138671875, -2.916473388671875, -2.769775390625, -2.623077392578125, -2.47637939453125, -2.329681396484375, -2.1829833984375, -2.036285400390625, -1.88958740234375, -1.742889404296875, -1.59619140625, -1.449493408203125, -1.30279541015625, -1.156097412109375, -1.0093994140625, -0.862701416015625, -0.71600341796875, -0.569305419921875, -0.422607421875, -0.275909423828125, -0.12921142578125, 0.017486572265625, 0.1641845703125, 0.310882568359375, 0.45758056640625, 0.604278564453125, 0.7509765625, 0.897674560546875, 1.04437255859375, 1.191070556640625, 1.3377685546875, 1.484466552734375, 1.63116455078125, 1.777862548828125, 1.924560546875, 2.071258544921875, 2.21795654296875, 2.364654541015625, 2.5113525390625, 2.658050537109375, 2.80474853515625, 2.951446533203125, 3.09814453125, 3.244842529296875, 3.39154052734375, 3.538238525390625, 3.6849365234375, 3.831634521484375, 3.97833251953125, 4.125030517578125, 4.271728515625, 4.418426513671875, 4.56512451171875, 4.711822509765625, 4.8585205078125, 5.005218505859375, 5.15191650390625, 5.298614501953125, 5.4453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 22.0, 24.0, 73.0, 85.0, 127.0, 141.0, 166.0, 134.0, 82.0, 58.0, 33.0, 20.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-62.87931442260742, -61.62422180175781, -60.3691291809082, -59.114036560058594, -57.85894775390625, -56.60385513305664, -55.34876251220703, -54.09366989135742, -52.83857727050781, -51.5834846496582, -50.328392028808594, -49.073299407958984, -47.818206787109375, -46.56311798095703, -45.30802536010742, -44.05293273925781, -42.7978401184082, -41.542747497558594, -40.287654876708984, -39.032562255859375, -37.77747344970703, -36.52238082885742, -35.26728820800781, -34.0121955871582, -32.757102966308594, -31.502010345458984, -30.246917724609375, -28.9918270111084, -27.73673439025879, -26.48164176940918, -25.226551055908203, -23.971458435058594, -22.71636962890625, -21.46127700805664, -20.20618438720703, -18.951093673706055, -17.696001052856445, -16.440908432006836, -15.185816764831543, -13.93072509765625, -12.67563247680664, -11.420539855957031, -10.165448188781738, -8.910356521606445, -7.655263900756836, -6.400171756744385, -5.145079612731934, -3.8899879455566406, -2.6348953247070312, -1.37980318069458, -0.1247110366821289, 1.1303811073303223, 2.3854732513427734, 3.6405653953552246, 4.895657539367676, 6.150749206542969, 7.405841827392578, 8.660934448242188, 9.91602611541748, 11.171117782592773, 12.426210403442383, 13.681303024291992, 14.936394691467285, 16.191486358642578, 17.446578979492188]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 10.0, 14.0, 11.0, 18.0, 24.0, 25.0, 26.0, 33.0, 49.0, 39.0, 49.0, 53.0, 51.0, 48.0, 46.0, 42.0, 47.0, 53.0, 42.0, 43.0, 44.0, 33.0, 31.0, 22.0, 27.0, 11.0, 25.0, 25.0, 6.0, 8.0, 11.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.885196685791016, -17.287769317626953, -16.69034194946289, -16.092914581298828, -15.495487213134766, -14.898059844970703, -14.300633430480957, -13.703206062316895, -13.105778694152832, -12.50835132598877, -11.910923957824707, -11.313496589660645, -10.716070175170898, -10.118642807006836, -9.521215438842773, -8.923788070678711, -8.326360702514648, -7.728933334350586, -7.131505966186523, -6.534079074859619, -5.936651706695557, -5.339224338531494, -4.74179744720459, -4.144370079040527, -3.546942710876465, -2.9495153427124023, -2.352088212966919, -1.754660964012146, -1.157233715057373, -0.5598063468933105, 0.03762078285217285, 0.6350479125976562, 1.2324771881103516, 1.8299044370651245, 2.4273316860198975, 3.024758815765381, 3.6221861839294434, 4.219613552093506, 4.81704044342041, 5.414467811584473, 6.011895179748535, 6.609322547912598, 7.20674991607666, 7.8041768074035645, 8.401603698730469, 8.999031066894531, 9.596458435058594, 10.193885803222656, 10.791313171386719, 11.388740539550781, 11.986167907714844, 12.583595275878906, 13.181022644042969, 13.778450012207031, 14.375876426696777, 14.97330379486084, 15.570731163024902, 16.16815757751465, 16.76558494567871, 17.363012313842773, 17.960439682006836, 18.5578670501709, 19.15529441833496, 19.752721786499023, 20.350149154663086]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 16.0, 11.0, 14.0, 19.0, 30.0, 42.0, 60.0, 116.0, 160.0, 287.0, 485.0, 945.0, 1808.0, 4038.0, 9445.0, 22800.0, 59854.0, 164536.0, 360135.0, 261821.0, 99042.0, 36726.0, 14628.0, 6085.0, 2577.0, 1305.0, 654.0, 345.0, 201.0, 120.0, 84.0, 55.0, 31.0, 17.0, 20.0, 11.0, 10.0, 6.0, 1.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.571533203125, -17.01806640625, -16.464599609375, -15.9111328125, -15.357666015625, -14.80419921875, -14.250732421875, -13.697265625, -13.143798828125, -12.59033203125, -12.036865234375, -11.4833984375, -10.929931640625, -10.37646484375, -9.822998046875, -9.26953125, -8.716064453125, -8.16259765625, -7.609130859375, -7.0556640625, -6.502197265625, -5.94873046875, -5.395263671875, -4.841796875, -4.288330078125, -3.73486328125, -3.181396484375, -2.6279296875, -2.074462890625, -1.52099609375, -0.967529296875, -0.4140625, 0.139404296875, 0.69287109375, 1.246337890625, 1.7998046875, 2.353271484375, 2.90673828125, 3.460205078125, 4.013671875, 4.567138671875, 5.12060546875, 5.674072265625, 6.2275390625, 6.781005859375, 7.33447265625, 7.887939453125, 8.44140625, 8.994873046875, 9.54833984375, 10.101806640625, 10.6552734375, 11.208740234375, 11.76220703125, 12.315673828125, 12.869140625, 13.422607421875, 13.97607421875, 14.529541015625, 15.0830078125, 15.636474609375, 16.18994140625, 16.743408203125, 17.296875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 9.0, 7.0, 11.0, 16.0, 21.0, 35.0, 45.0, 36.0, 46.0, 57.0, 62.0, 52.0, 83.0, 66.0, 65.0, 63.0, 60.0, 36.0, 42.0, 25.0, 36.0, 32.0, 18.0, 20.0, 15.0, 8.0, 13.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4345703125, -1.3819580078125, -1.329345703125, -1.2767333984375, -1.22412109375, -1.1715087890625, -1.118896484375, -1.0662841796875, -1.013671875, -0.9610595703125, -0.908447265625, -0.8558349609375, -0.80322265625, -0.7506103515625, -0.697998046875, -0.6453857421875, -0.5927734375, -0.5401611328125, -0.487548828125, -0.4349365234375, -0.38232421875, -0.3297119140625, -0.277099609375, -0.2244873046875, -0.171875, -0.1192626953125, -0.066650390625, -0.0140380859375, 0.03857421875, 0.0911865234375, 0.143798828125, 0.1964111328125, 0.2490234375, 0.3016357421875, 0.354248046875, 0.4068603515625, 0.45947265625, 0.5120849609375, 0.564697265625, 0.6173095703125, 0.669921875, 0.7225341796875, 0.775146484375, 0.8277587890625, 0.88037109375, 0.9329833984375, 0.985595703125, 1.0382080078125, 1.0908203125, 1.1434326171875, 1.196044921875, 1.2486572265625, 1.30126953125, 1.3538818359375, 1.406494140625, 1.4591064453125, 1.51171875, 1.5643310546875, 1.616943359375, 1.6695556640625, 1.72216796875, 1.7747802734375, 1.827392578125, 1.8800048828125, 1.9326171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 9.0, 19.0, 27.0, 25.0, 63.0, 73.0, 117.0, 157.0, 262.0, 451.0, 884.0, 2022.0, 5251.0, 17182.0, 68227.0, 287011.0, 467310.0, 148265.0, 35222.0, 9779.0, 3286.0, 1320.0, 655.0, 345.0, 202.0, 139.0, 91.0, 49.0, 33.0, 25.0, 15.0, 10.0, 8.0, 8.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.96875, -29.16455078125, -28.3603515625, -27.55615234375, -26.751953125, -25.94775390625, -25.1435546875, -24.33935546875, -23.53515625, -22.73095703125, -21.9267578125, -21.12255859375, -20.318359375, -19.51416015625, -18.7099609375, -17.90576171875, -17.1015625, -16.29736328125, -15.4931640625, -14.68896484375, -13.884765625, -13.08056640625, -12.2763671875, -11.47216796875, -10.66796875, -9.86376953125, -9.0595703125, -8.25537109375, -7.451171875, -6.64697265625, -5.8427734375, -5.03857421875, -4.234375, -3.43017578125, -2.6259765625, -1.82177734375, -1.017578125, -0.21337890625, 0.5908203125, 1.39501953125, 2.19921875, 3.00341796875, 3.8076171875, 4.61181640625, 5.416015625, 6.22021484375, 7.0244140625, 7.82861328125, 8.6328125, 9.43701171875, 10.2412109375, 11.04541015625, 11.849609375, 12.65380859375, 13.4580078125, 14.26220703125, 15.06640625, 15.87060546875, 16.6748046875, 17.47900390625, 18.283203125, 19.08740234375, 19.8916015625, 20.69580078125, 21.5]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 11.0, 8.0, 16.0, 16.0, 13.0, 22.0, 29.0, 31.0, 37.0, 34.0, 43.0, 52.0, 46.0, 49.0, 42.0, 54.0, 51.0, 53.0, 55.0, 41.0, 47.0, 44.0, 41.0, 30.0, 36.0, 21.0, 17.0, 12.0, 8.0, 9.0, 8.0, 5.0, 10.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.857666015625, -10.54345703125, -10.229248046875, -9.9150390625, -9.600830078125, -9.28662109375, -8.972412109375, -8.658203125, -8.343994140625, -8.02978515625, -7.715576171875, -7.4013671875, -7.087158203125, -6.77294921875, -6.458740234375, -6.14453125, -5.830322265625, -5.51611328125, -5.201904296875, -4.8876953125, -4.573486328125, -4.25927734375, -3.945068359375, -3.630859375, -3.316650390625, -3.00244140625, -2.688232421875, -2.3740234375, -2.059814453125, -1.74560546875, -1.431396484375, -1.1171875, -0.802978515625, -0.48876953125, -0.174560546875, 0.1396484375, 0.453857421875, 0.76806640625, 1.082275390625, 1.396484375, 1.710693359375, 2.02490234375, 2.339111328125, 2.6533203125, 2.967529296875, 3.28173828125, 3.595947265625, 3.91015625, 4.224365234375, 4.53857421875, 4.852783203125, 5.1669921875, 5.481201171875, 5.79541015625, 6.109619140625, 6.423828125, 6.738037109375, 7.05224609375, 7.366455078125, 7.6806640625, 7.994873046875, 8.30908203125, 8.623291015625, 8.9375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 1.0, 3.0, 4.0, 5.0, 10.0, 7.0, 9.0, 13.0, 14.0, 12.0, 33.0, 41.0, 62.0, 130.0, 200.0, 335.0, 592.0, 1219.0, 2589.0, 6517.0, 19300.0, 69008.0, 262591.0, 452029.0, 167878.0, 44070.0, 13146.0, 4670.0, 1927.0, 984.0, 455.0, 269.0, 150.0, 94.0, 65.0, 24.0, 28.0, 12.0, 12.0, 11.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.203125, -15.650634765625, -15.09814453125, -14.545654296875, -13.9931640625, -13.440673828125, -12.88818359375, -12.335693359375, -11.783203125, -11.230712890625, -10.67822265625, -10.125732421875, -9.5732421875, -9.020751953125, -8.46826171875, -7.915771484375, -7.36328125, -6.810791015625, -6.25830078125, -5.705810546875, -5.1533203125, -4.600830078125, -4.04833984375, -3.495849609375, -2.943359375, -2.390869140625, -1.83837890625, -1.285888671875, -0.7333984375, -0.180908203125, 0.37158203125, 0.924072265625, 1.4765625, 2.029052734375, 2.58154296875, 3.134033203125, 3.6865234375, 4.239013671875, 4.79150390625, 5.343994140625, 5.896484375, 6.448974609375, 7.00146484375, 7.553955078125, 8.1064453125, 8.658935546875, 9.21142578125, 9.763916015625, 10.31640625, 10.868896484375, 11.42138671875, 11.973876953125, 12.5263671875, 13.078857421875, 13.63134765625, 14.183837890625, 14.736328125, 15.288818359375, 15.84130859375, 16.393798828125, 16.9462890625, 17.498779296875, 18.05126953125, 18.603759765625, 19.15625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 15.0, 11.0, 13.0, 18.0, 16.0, 11.0, 40.0, 44.0, 50.0, 77.0, 65.0, 72.0, 93.0, 77.0, 72.0, 60.0, 32.0, 47.0, 30.0, 25.0, 23.0, 16.0, 11.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.001888275146484375, -0.0018323957920074463, -0.0017765164375305176, -0.0017206370830535889, -0.0016647577285766602, -0.0016088783740997314, -0.0015529990196228027, -0.001497119665145874, -0.0014412403106689453, -0.0013853609561920166, -0.0013294816017150879, -0.0012736022472381592, -0.0012177228927612305, -0.0011618435382843018, -0.001105964183807373, -0.0010500848293304443, -0.0009942054748535156, -0.0009383261203765869, -0.0008824467658996582, -0.0008265674114227295, -0.0007706880569458008, -0.0007148087024688721, -0.0006589293479919434, -0.0006030499935150146, -0.0005471706390380859, -0.0004912912845611572, -0.0004354119300842285, -0.0003795325756072998, -0.0003236532211303711, -0.0002677738666534424, -0.00021189451217651367, -0.00015601515769958496, -0.00010013580322265625, -4.425644874572754e-05, 1.1622905731201172e-05, 6.750226020812988e-05, 0.0001233816146850586, 0.0001792609691619873, 0.00023514032363891602, 0.0002910196781158447, 0.00034689903259277344, 0.00040277838706970215, 0.00045865774154663086, 0.0005145370960235596, 0.0005704164505004883, 0.000626295804977417, 0.0006821751594543457, 0.0007380545139312744, 0.0007939338684082031, 0.0008498132228851318, 0.0009056925773620605, 0.0009615719318389893, 0.001017451286315918, 0.0010733306407928467, 0.0011292099952697754, 0.001185089349746704, 0.0012409687042236328, 0.0012968480587005615, 0.0013527274131774902, 0.001408606767654419, 0.0014644861221313477, 0.0015203654766082764, 0.001576244831085205, 0.0016321241855621338, 0.0016880035400390625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 20.0, 14.0, 27.0, 23.0, 53.0, 57.0, 95.0, 145.0, 196.0, 347.0, 542.0, 976.0, 1798.0, 3676.0, 8680.0, 22346.0, 67334.0, 235181.0, 450435.0, 173766.0, 51341.0, 17517.0, 6928.0, 3191.0, 1555.0, 803.0, 490.0, 330.0, 203.0, 147.0, 94.0, 68.0, 41.0, 30.0, 19.0, 19.0, 14.0, 7.0, 3.0, 8.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-18.109375, -17.5975341796875, -17.085693359375, -16.5738525390625, -16.06201171875, -15.5501708984375, -15.038330078125, -14.5264892578125, -14.0146484375, -13.5028076171875, -12.990966796875, -12.4791259765625, -11.96728515625, -11.4554443359375, -10.943603515625, -10.4317626953125, -9.919921875, -9.4080810546875, -8.896240234375, -8.3843994140625, -7.87255859375, -7.3607177734375, -6.848876953125, -6.3370361328125, -5.8251953125, -5.3133544921875, -4.801513671875, -4.2896728515625, -3.77783203125, -3.2659912109375, -2.754150390625, -2.2423095703125, -1.73046875, -1.2186279296875, -0.706787109375, -0.1949462890625, 0.31689453125, 0.8287353515625, 1.340576171875, 1.8524169921875, 2.3642578125, 2.8760986328125, 3.387939453125, 3.8997802734375, 4.41162109375, 4.9234619140625, 5.435302734375, 5.9471435546875, 6.458984375, 6.9708251953125, 7.482666015625, 7.9945068359375, 8.50634765625, 9.0181884765625, 9.530029296875, 10.0418701171875, 10.5537109375, 11.0655517578125, 11.577392578125, 12.0892333984375, 12.60107421875, 13.1129150390625, 13.624755859375, 14.1365966796875, 14.6484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 3.0, 6.0, 13.0, 11.0, 20.0, 22.0, 11.0, 16.0, 32.0, 39.0, 56.0, 55.0, 55.0, 83.0, 74.0, 69.0, 62.0, 73.0, 49.0, 53.0, 25.0, 21.0, 23.0, 23.0, 26.0, 25.0, 13.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.1875, -7.9222412109375, -7.656982421875, -7.3917236328125, -7.12646484375, -6.8612060546875, -6.595947265625, -6.3306884765625, -6.0654296875, -5.8001708984375, -5.534912109375, -5.2696533203125, -5.00439453125, -4.7391357421875, -4.473876953125, -4.2086181640625, -3.943359375, -3.6781005859375, -3.412841796875, -3.1475830078125, -2.88232421875, -2.6170654296875, -2.351806640625, -2.0865478515625, -1.8212890625, -1.5560302734375, -1.290771484375, -1.0255126953125, -0.76025390625, -0.4949951171875, -0.229736328125, 0.0355224609375, 0.30078125, 0.5660400390625, 0.831298828125, 1.0965576171875, 1.36181640625, 1.6270751953125, 1.892333984375, 2.1575927734375, 2.4228515625, 2.6881103515625, 2.953369140625, 3.2186279296875, 3.48388671875, 3.7491455078125, 4.014404296875, 4.2796630859375, 4.544921875, 4.8101806640625, 5.075439453125, 5.3406982421875, 5.60595703125, 5.8712158203125, 6.136474609375, 6.4017333984375, 6.6669921875, 6.9322509765625, 7.197509765625, 7.4627685546875, 7.72802734375, 7.9932861328125, 8.258544921875, 8.5238037109375, 8.7890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 13.0, 27.0, 67.0, 181.0, 295.0, 223.0, 123.0, 41.0, 21.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-321.84857177734375, -312.315673828125, -302.7828063964844, -293.2499084472656, -283.7170104980469, -274.1841125488281, -264.6512451171875, -255.11834716796875, -245.58544921875, -236.0525665283203, -226.51966857910156, -216.98678588867188, -207.45388793945312, -197.92100524902344, -188.38812255859375, -178.855224609375, -169.3223419189453, -159.78945922851562, -150.25656127929688, -140.7236785888672, -131.19078063964844, -121.65789794921875, -112.12500762939453, -102.59211730957031, -93.0592269897461, -83.52633666992188, -73.99344635009766, -64.46055603027344, -54.927669525146484, -45.394779205322266, -35.86189270019531, -26.329002380371094, -16.796112060546875, -7.263222694396973, 2.2696666717529297, 11.802555084228516, 21.335445404052734, 30.868335723876953, 40.401222229003906, 49.934112548828125, 59.467002868652344, 68.99989318847656, 78.53278350830078, 88.065673828125, 97.59855651855469, 107.13145446777344, 116.66433715820312, 126.19722747802734, 135.73011779785156, 145.26300048828125, 154.7958984375, 164.3287811279297, 173.86167907714844, 183.39456176757812, 192.92745971679688, 202.46034240722656, 211.99322509765625, 221.52610778808594, 231.0590057373047, 240.59188842773438, 250.12478637695312, 259.6576843261719, 269.1905517578125, 278.72344970703125, 288.25634765625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 10.0, 7.0, 13.0, 7.0, 16.0, 11.0, 15.0, 21.0, 22.0, 23.0, 30.0, 35.0, 39.0, 30.0, 49.0, 44.0, 45.0, 37.0, 42.0, 42.0, 46.0, 47.0, 36.0, 37.0, 41.0, 33.0, 31.0, 34.0, 22.0, 19.0, 18.0, 14.0, 9.0, 13.0, 10.0, 9.0, 7.0, 10.0, 5.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-59.08879852294922, -57.03484344482422, -54.98088836669922, -52.92693328857422, -50.87297821044922, -48.81902313232422, -46.76506423950195, -44.71110916137695, -42.65715408325195, -40.60319900512695, -38.54924392700195, -36.49528884887695, -34.44132995605469, -32.38737487792969, -30.333419799804688, -28.279464721679688, -26.225509643554688, -24.171554565429688, -22.117599487304688, -20.063642501831055, -18.009687423706055, -15.955732345581055, -13.901776313781738, -11.847820281982422, -9.793865203857422, -7.739909648895264, -5.6859540939331055, -3.6319985389709473, -1.578042984008789, 0.47591209411621094, 2.5298681259155273, 4.583824157714844, 6.6377716064453125, 8.691726684570312, 10.745682716369629, 12.799638748168945, 14.853593826293945, 16.907548904418945, 18.961505889892578, 21.015460968017578, 23.069416046142578, 25.123371124267578, 27.177326202392578, 29.23128318786621, 31.28523826599121, 33.339195251464844, 35.393150329589844, 37.447105407714844, 39.501060485839844, 41.555015563964844, 43.608970642089844, 45.662925720214844, 47.716880798339844, 49.770835876464844, 51.82479476928711, 53.87874984741211, 55.93270492553711, 57.98666000366211, 60.04061508178711, 62.09457015991211, 64.14852905273438, 66.20248413085938, 68.25643920898438, 70.31039428710938, 72.36434936523438]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 26.0, 28.0, 52.0, 91.0, 96.0, 157.0, 255.0, 413.0, 765.0, 1309.0, 2457.0, 5030.0, 11114.0, 26994.0, 75214.0, 270423.0, 2748741.0, 811358.0, 153873.0, 49133.0, 18857.0, 8379.0, 4086.0, 2091.0, 1147.0, 671.0, 472.0, 311.0, 206.0, 138.0, 88.0, 71.0, 42.0, 33.0, 16.0, 17.0, 11.0, 12.0, 18.0, 6.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-21.609375, -20.88427734375, -20.1591796875, -19.43408203125, -18.708984375, -17.98388671875, -17.2587890625, -16.53369140625, -15.80859375, -15.08349609375, -14.3583984375, -13.63330078125, -12.908203125, -12.18310546875, -11.4580078125, -10.73291015625, -10.0078125, -9.28271484375, -8.5576171875, -7.83251953125, -7.107421875, -6.38232421875, -5.6572265625, -4.93212890625, -4.20703125, -3.48193359375, -2.7568359375, -2.03173828125, -1.306640625, -0.58154296875, 0.1435546875, 0.86865234375, 1.59375, 2.31884765625, 3.0439453125, 3.76904296875, 4.494140625, 5.21923828125, 5.9443359375, 6.66943359375, 7.39453125, 8.11962890625, 8.8447265625, 9.56982421875, 10.294921875, 11.02001953125, 11.7451171875, 12.47021484375, 13.1953125, 13.92041015625, 14.6455078125, 15.37060546875, 16.095703125, 16.82080078125, 17.5458984375, 18.27099609375, 18.99609375, 19.72119140625, 20.4462890625, 21.17138671875, 21.896484375, 22.62158203125, 23.3466796875, 24.07177734375, 24.796875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 6.0, 3.0, 10.0, 14.0, 9.0, 25.0, 23.0, 30.0, 33.0, 41.0, 47.0, 41.0, 41.0, 53.0, 58.0, 64.0, 48.0, 60.0, 40.0, 53.0, 53.0, 45.0, 33.0, 39.0, 22.0, 19.0, 15.0, 11.0, 16.0, 11.0, 4.0, 8.0, 8.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6566619873046875, -1.595550537109375, -1.5344390869140625, -1.47332763671875, -1.4122161865234375, -1.351104736328125, -1.2899932861328125, -1.2288818359375, -1.1677703857421875, -1.106658935546875, -1.0455474853515625, -0.98443603515625, -0.9233245849609375, -0.862213134765625, -0.8011016845703125, -0.739990234375, -0.6788787841796875, -0.617767333984375, -0.5566558837890625, -0.49554443359375, -0.4344329833984375, -0.373321533203125, -0.3122100830078125, -0.2510986328125, -0.1899871826171875, -0.128875732421875, -0.0677642822265625, -0.00665283203125, 0.0544586181640625, 0.115570068359375, 0.1766815185546875, 0.23779296875, 0.2989044189453125, 0.360015869140625, 0.4211273193359375, 0.48223876953125, 0.5433502197265625, 0.604461669921875, 0.6655731201171875, 0.7266845703125, 0.7877960205078125, 0.848907470703125, 0.9100189208984375, 0.97113037109375, 1.0322418212890625, 1.093353271484375, 1.1544647216796875, 1.215576171875, 1.2766876220703125, 1.337799072265625, 1.3989105224609375, 1.46002197265625, 1.5211334228515625, 1.582244873046875, 1.6433563232421875, 1.7044677734375, 1.7655792236328125, 1.826690673828125, 1.8878021240234375, 1.94891357421875, 2.0100250244140625, 2.071136474609375, 2.1322479248046875, 2.193359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 14.0, 16.0, 16.0, 22.0, 55.0, 76.0, 116.0, 172.0, 310.0, 496.0, 905.0, 1612.0, 3267.0, 6985.0, 17693.0, 52318.0, 201869.0, 1362243.0, 2202213.0, 247301.0, 61260.0, 19933.0, 7835.0, 3485.0, 1722.0, 952.0, 548.0, 310.0, 187.0, 121.0, 62.0, 48.0, 32.0, 19.0, 7.0, 15.0, 14.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-29.578125, -28.68359375, -27.7890625, -26.89453125, -26.0, -25.10546875, -24.2109375, -23.31640625, -22.421875, -21.52734375, -20.6328125, -19.73828125, -18.84375, -17.94921875, -17.0546875, -16.16015625, -15.265625, -14.37109375, -13.4765625, -12.58203125, -11.6875, -10.79296875, -9.8984375, -9.00390625, -8.109375, -7.21484375, -6.3203125, -5.42578125, -4.53125, -3.63671875, -2.7421875, -1.84765625, -0.953125, -0.05859375, 0.8359375, 1.73046875, 2.625, 3.51953125, 4.4140625, 5.30859375, 6.203125, 7.09765625, 7.9921875, 8.88671875, 9.78125, 10.67578125, 11.5703125, 12.46484375, 13.359375, 14.25390625, 15.1484375, 16.04296875, 16.9375, 17.83203125, 18.7265625, 19.62109375, 20.515625, 21.41015625, 22.3046875, 23.19921875, 24.09375, 24.98828125, 25.8828125, 26.77734375, 27.671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 14.0, 15.0, 20.0, 37.0, 53.0, 72.0, 102.0, 114.0, 229.0, 323.0, 622.0, 1156.0, 429.0, 297.0, 171.0, 115.0, 80.0, 51.0, 49.0, 18.0, 18.0, 19.0, 7.0, 6.0, 5.0, 11.0, 10.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.44140625, -7.2305908203125, -7.019775390625, -6.8089599609375, -6.59814453125, -6.3873291015625, -6.176513671875, -5.9656982421875, -5.7548828125, -5.5440673828125, -5.333251953125, -5.1224365234375, -4.91162109375, -4.7008056640625, -4.489990234375, -4.2791748046875, -4.068359375, -3.8575439453125, -3.646728515625, -3.4359130859375, -3.22509765625, -3.0142822265625, -2.803466796875, -2.5926513671875, -2.3818359375, -2.1710205078125, -1.960205078125, -1.7493896484375, -1.53857421875, -1.3277587890625, -1.116943359375, -0.9061279296875, -0.6953125, -0.4844970703125, -0.273681640625, -0.0628662109375, 0.14794921875, 0.3587646484375, 0.569580078125, 0.7803955078125, 0.9912109375, 1.2020263671875, 1.412841796875, 1.6236572265625, 1.83447265625, 2.0452880859375, 2.256103515625, 2.4669189453125, 2.677734375, 2.8885498046875, 3.099365234375, 3.3101806640625, 3.52099609375, 3.7318115234375, 3.942626953125, 4.1534423828125, 4.3642578125, 4.5750732421875, 4.785888671875, 4.9967041015625, 5.20751953125, 5.4183349609375, 5.629150390625, 5.8399658203125, 6.05078125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 11.0, 18.0, 19.0, 86.0, 191.0, 267.0, 213.0, 120.0, 56.0, 15.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-160.84622192382812, -157.54103088378906, -154.23583984375, -150.9306640625, -147.62547302246094, -144.32028198242188, -141.0150909423828, -137.70989990234375, -134.4047088623047, -131.09951782226562, -127.7943344116211, -124.48914337158203, -121.18395233154297, -117.87876892089844, -114.57357788085938, -111.26838684082031, -107.96321105957031, -104.65802001953125, -101.35283660888672, -98.04764556884766, -94.7424545288086, -91.43727111816406, -88.132080078125, -84.82688903808594, -81.52169799804688, -78.21650695800781, -74.91132354736328, -71.60613250732422, -68.30094146728516, -64.99575805664062, -61.69056701660156, -58.385379791259766, -55.08019256591797, -51.77500534057617, -48.46981430053711, -45.16462707519531, -41.859439849853516, -38.55425262451172, -35.249061584472656, -31.94387435913086, -28.63868522644043, -25.33349609375, -22.028308868408203, -18.723119735717773, -15.41793155670166, -12.112743377685547, -8.807554244995117, -5.50236701965332, -2.1971778869628906, 1.1080105304718018, 4.413198947906494, 7.718387603759766, 11.023575782775879, 14.328763961791992, 17.633953094482422, 20.93914031982422, 24.24432945251465, 27.549518585205078, 30.854705810546875, 34.15989685058594, 37.465084075927734, 40.77027130126953, 44.075462341308594, 47.380645751953125, 50.68583679199219]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 8.0, 5.0, 11.0, 8.0, 7.0, 9.0, 7.0, 15.0, 20.0, 27.0, 18.0, 19.0, 28.0, 38.0, 22.0, 41.0, 41.0, 41.0, 33.0, 52.0, 46.0, 41.0, 45.0, 34.0, 38.0, 26.0, 36.0, 35.0, 39.0, 30.0, 24.0, 23.0, 18.0, 17.0, 16.0, 16.0, 12.0, 8.0, 7.0, 7.0, 4.0, 2.0, 6.0, 3.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-24.859554290771484, -24.095962524414062, -23.332368850708008, -22.568777084350586, -21.80518341064453, -21.04159164428711, -20.277999877929688, -19.514408111572266, -18.75081443786621, -17.98722267150879, -17.223628997802734, -16.460037231445312, -15.696444511413574, -14.932851791381836, -14.169260025024414, -13.405667304992676, -12.642074584960938, -11.8784818649292, -11.114889144897461, -10.351297378540039, -9.5877046585083, -8.824111938476562, -8.06052017211914, -7.296927452087402, -6.533334732055664, -5.769742012023926, -5.006149768829346, -4.242557525634766, -3.4789648056030273, -2.715372323989868, -1.951779842376709, -1.188187599182129, -0.4245948791503906, 0.33899760246276855, 1.1025900840759277, 1.866182565689087, 2.629775047302246, 3.3933675289154053, 4.1569600105285645, 4.9205522537231445, 5.684144973754883, 6.447737693786621, 7.211329936981201, 7.974922180175781, 8.73851490020752, 9.502107620239258, 10.26569938659668, 11.029292106628418, 11.792884826660156, 12.556477546691895, 13.320070266723633, 14.083662033081055, 14.847254753112793, 15.610847473144531, 16.374439239501953, 17.138031005859375, 17.90162467956543, 18.66521644592285, 19.428810119628906, 20.192401885986328, 20.95599365234375, 21.719587326049805, 22.483179092407227, 23.24677276611328, 24.010364532470703]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 12.0, 20.0, 23.0, 27.0, 38.0, 58.0, 106.0, 159.0, 206.0, 358.0, 662.0, 1174.0, 2118.0, 4373.0, 8855.0, 19203.0, 40406.0, 85325.0, 172143.0, 272525.0, 219916.0, 115239.0, 55266.0, 26025.0, 12226.0, 5782.0, 2828.0, 1419.0, 795.0, 428.0, 295.0, 175.0, 125.0, 58.0, 54.0, 32.0, 21.0, 25.0, 15.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.90625, -13.453369140625, -13.00048828125, -12.547607421875, -12.0947265625, -11.641845703125, -11.18896484375, -10.736083984375, -10.283203125, -9.830322265625, -9.37744140625, -8.924560546875, -8.4716796875, -8.018798828125, -7.56591796875, -7.113037109375, -6.66015625, -6.207275390625, -5.75439453125, -5.301513671875, -4.8486328125, -4.395751953125, -3.94287109375, -3.489990234375, -3.037109375, -2.584228515625, -2.13134765625, -1.678466796875, -1.2255859375, -0.772705078125, -0.31982421875, 0.133056640625, 0.5859375, 1.038818359375, 1.49169921875, 1.944580078125, 2.3974609375, 2.850341796875, 3.30322265625, 3.756103515625, 4.208984375, 4.661865234375, 5.11474609375, 5.567626953125, 6.0205078125, 6.473388671875, 6.92626953125, 7.379150390625, 7.83203125, 8.284912109375, 8.73779296875, 9.190673828125, 9.6435546875, 10.096435546875, 10.54931640625, 11.002197265625, 11.455078125, 11.907958984375, 12.36083984375, 12.813720703125, 13.2666015625, 13.719482421875, 14.17236328125, 14.625244140625, 15.078125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 11.0, 9.0, 15.0, 16.0, 18.0, 20.0, 22.0, 23.0, 31.0, 25.0, 48.0, 60.0, 54.0, 42.0, 53.0, 49.0, 52.0, 41.0, 49.0, 51.0, 40.0, 41.0, 30.0, 28.0, 34.0, 21.0, 27.0, 12.0, 11.0, 14.0, 8.0, 11.0, 9.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7841796875, -1.7180023193359375, -1.651824951171875, -1.5856475830078125, -1.51947021484375, -1.4532928466796875, -1.387115478515625, -1.3209381103515625, -1.2547607421875, -1.1885833740234375, -1.122406005859375, -1.0562286376953125, -0.99005126953125, -0.9238739013671875, -0.857696533203125, -0.7915191650390625, -0.725341796875, -0.6591644287109375, -0.592987060546875, -0.5268096923828125, -0.46063232421875, -0.3944549560546875, -0.328277587890625, -0.2621002197265625, -0.1959228515625, -0.1297454833984375, -0.063568115234375, 0.0026092529296875, 0.06878662109375, 0.1349639892578125, 0.201141357421875, 0.2673187255859375, 0.33349609375, 0.3996734619140625, 0.465850830078125, 0.5320281982421875, 0.59820556640625, 0.6643829345703125, 0.730560302734375, 0.7967376708984375, 0.8629150390625, 0.9290924072265625, 0.995269775390625, 1.0614471435546875, 1.12762451171875, 1.1938018798828125, 1.259979248046875, 1.3261566162109375, 1.392333984375, 1.4585113525390625, 1.524688720703125, 1.5908660888671875, 1.65704345703125, 1.7232208251953125, 1.789398193359375, 1.8555755615234375, 1.9217529296875, 1.9879302978515625, 2.054107666015625, 2.1202850341796875, 2.18646240234375, 2.2526397705078125, 2.318817138671875, 2.3849945068359375, 2.451171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 4.0, 10.0, 16.0, 31.0, 37.0, 26.0, 55.0, 76.0, 117.0, 137.0, 186.0, 330.0, 447.0, 843.0, 1564.0, 3232.0, 7495.0, 19161.0, 54524.0, 160508.0, 411584.0, 253172.0, 85230.0, 29583.0, 10796.0, 4553.0, 2050.0, 1007.0, 604.0, 360.0, 252.0, 164.0, 101.0, 83.0, 50.0, 45.0, 29.0, 19.0, 18.0, 17.0, 10.0, 11.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.1875, -22.406982421875, -21.62646484375, -20.845947265625, -20.0654296875, -19.284912109375, -18.50439453125, -17.723876953125, -16.943359375, -16.162841796875, -15.38232421875, -14.601806640625, -13.8212890625, -13.040771484375, -12.26025390625, -11.479736328125, -10.69921875, -9.918701171875, -9.13818359375, -8.357666015625, -7.5771484375, -6.796630859375, -6.01611328125, -5.235595703125, -4.455078125, -3.674560546875, -2.89404296875, -2.113525390625, -1.3330078125, -0.552490234375, 0.22802734375, 1.008544921875, 1.7890625, 2.569580078125, 3.35009765625, 4.130615234375, 4.9111328125, 5.691650390625, 6.47216796875, 7.252685546875, 8.033203125, 8.813720703125, 9.59423828125, 10.374755859375, 11.1552734375, 11.935791015625, 12.71630859375, 13.496826171875, 14.27734375, 15.057861328125, 15.83837890625, 16.618896484375, 17.3994140625, 18.179931640625, 18.96044921875, 19.740966796875, 20.521484375, 21.302001953125, 22.08251953125, 22.863037109375, 23.6435546875, 24.424072265625, 25.20458984375, 25.985107421875, 26.765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 8.0, 6.0, 6.0, 6.0, 11.0, 12.0, 13.0, 19.0, 24.0, 24.0, 29.0, 31.0, 26.0, 39.0, 35.0, 39.0, 36.0, 53.0, 56.0, 42.0, 56.0, 43.0, 36.0, 45.0, 32.0, 42.0, 29.0, 34.0, 33.0, 20.0, 27.0, 14.0, 12.0, 8.0, 14.0, 6.0, 6.0, 6.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.734375, -12.2916259765625, -11.848876953125, -11.4061279296875, -10.96337890625, -10.5206298828125, -10.077880859375, -9.6351318359375, -9.1923828125, -8.7496337890625, -8.306884765625, -7.8641357421875, -7.42138671875, -6.9786376953125, -6.535888671875, -6.0931396484375, -5.650390625, -5.2076416015625, -4.764892578125, -4.3221435546875, -3.87939453125, -3.4366455078125, -2.993896484375, -2.5511474609375, -2.1083984375, -1.6656494140625, -1.222900390625, -0.7801513671875, -0.33740234375, 0.1053466796875, 0.548095703125, 0.9908447265625, 1.43359375, 1.8763427734375, 2.319091796875, 2.7618408203125, 3.20458984375, 3.6473388671875, 4.090087890625, 4.5328369140625, 4.9755859375, 5.4183349609375, 5.861083984375, 6.3038330078125, 6.74658203125, 7.1893310546875, 7.632080078125, 8.0748291015625, 8.517578125, 8.9603271484375, 9.403076171875, 9.8458251953125, 10.28857421875, 10.7313232421875, 11.174072265625, 11.6168212890625, 12.0595703125, 12.5023193359375, 12.945068359375, 13.3878173828125, 13.83056640625, 14.2733154296875, 14.716064453125, 15.1588134765625, 15.6015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 10.0, 22.0, 13.0, 16.0, 34.0, 55.0, 77.0, 143.0, 239.0, 455.0, 896.0, 2099.0, 4831.0, 12808.0, 39943.0, 152448.0, 532489.0, 220625.0, 53768.0, 16613.0, 6178.0, 2485.0, 1072.0, 534.0, 265.0, 141.0, 86.0, 70.0, 38.0, 23.0, 27.0, 15.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.03125, -19.45263671875, -18.8740234375, -18.29541015625, -17.716796875, -17.13818359375, -16.5595703125, -15.98095703125, -15.40234375, -14.82373046875, -14.2451171875, -13.66650390625, -13.087890625, -12.50927734375, -11.9306640625, -11.35205078125, -10.7734375, -10.19482421875, -9.6162109375, -9.03759765625, -8.458984375, -7.88037109375, -7.3017578125, -6.72314453125, -6.14453125, -5.56591796875, -4.9873046875, -4.40869140625, -3.830078125, -3.25146484375, -2.6728515625, -2.09423828125, -1.515625, -0.93701171875, -0.3583984375, 0.22021484375, 0.798828125, 1.37744140625, 1.9560546875, 2.53466796875, 3.11328125, 3.69189453125, 4.2705078125, 4.84912109375, 5.427734375, 6.00634765625, 6.5849609375, 7.16357421875, 7.7421875, 8.32080078125, 8.8994140625, 9.47802734375, 10.056640625, 10.63525390625, 11.2138671875, 11.79248046875, 12.37109375, 12.94970703125, 13.5283203125, 14.10693359375, 14.685546875, 15.26416015625, 15.8427734375, 16.42138671875, 17.0]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 6.0, 19.0, 13.0, 23.0, 29.0, 21.0, 42.0, 39.0, 64.0, 96.0, 178.0, 140.0, 69.0, 53.0, 41.0, 26.0, 21.0, 19.0, 19.0, 7.0, 17.0, 7.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0037059783935546875, -0.003614872694015503, -0.0035237669944763184, -0.003432661294937134, -0.0033415555953979492, -0.0032504498958587646, -0.00315934419631958, -0.0030682384967803955, -0.002977132797241211, -0.0028860270977020264, -0.002794921398162842, -0.0027038156986236572, -0.0026127099990844727, -0.002521604299545288, -0.0024304986000061035, -0.002339392900466919, -0.0022482872009277344, -0.00215718150138855, -0.0020660758018493652, -0.0019749701023101807, -0.001883864402770996, -0.0017927587032318115, -0.001701653003692627, -0.0016105473041534424, -0.0015194416046142578, -0.0014283359050750732, -0.0013372302055358887, -0.001246124505996704, -0.0011550188064575195, -0.001063913106918335, -0.0009728074073791504, -0.0008817017078399658, -0.0007905960083007812, -0.0006994903087615967, -0.0006083846092224121, -0.0005172789096832275, -0.00042617321014404297, -0.0003350675106048584, -0.00024396181106567383, -0.00015285611152648926, -6.175041198730469e-05, 2.9355287551879883e-05, 0.00012046098709106445, 0.00021156668663024902, 0.0003026723861694336, 0.00039377808570861816, 0.00048488378524780273, 0.0005759894847869873, 0.0006670951843261719, 0.0007582008838653564, 0.000849306583404541, 0.0009404122829437256, 0.0010315179824829102, 0.0011226236820220947, 0.0012137293815612793, 0.0013048350811004639, 0.0013959407806396484, 0.001487046480178833, 0.0015781521797180176, 0.0016692578792572021, 0.0017603635787963867, 0.0018514692783355713, 0.0019425749778747559, 0.0020336806774139404, 0.002124786376953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 12.0, 14.0, 17.0, 19.0, 35.0, 49.0, 69.0, 75.0, 123.0, 170.0, 274.0, 477.0, 805.0, 1469.0, 2925.0, 5893.0, 13675.0, 35363.0, 113014.0, 471695.0, 288496.0, 69825.0, 24111.0, 10000.0, 4588.0, 2233.0, 1185.0, 636.0, 399.0, 248.0, 187.0, 110.0, 91.0, 52.0, 51.0, 39.0, 32.0, 25.0, 15.0, 14.0, 10.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.25, -18.6806640625, -18.111328125, -17.5419921875, -16.97265625, -16.4033203125, -15.833984375, -15.2646484375, -14.6953125, -14.1259765625, -13.556640625, -12.9873046875, -12.41796875, -11.8486328125, -11.279296875, -10.7099609375, -10.140625, -9.5712890625, -9.001953125, -8.4326171875, -7.86328125, -7.2939453125, -6.724609375, -6.1552734375, -5.5859375, -5.0166015625, -4.447265625, -3.8779296875, -3.30859375, -2.7392578125, -2.169921875, -1.6005859375, -1.03125, -0.4619140625, 0.107421875, 0.6767578125, 1.24609375, 1.8154296875, 2.384765625, 2.9541015625, 3.5234375, 4.0927734375, 4.662109375, 5.2314453125, 5.80078125, 6.3701171875, 6.939453125, 7.5087890625, 8.078125, 8.6474609375, 9.216796875, 9.7861328125, 10.35546875, 10.9248046875, 11.494140625, 12.0634765625, 12.6328125, 13.2021484375, 13.771484375, 14.3408203125, 14.91015625, 15.4794921875, 16.048828125, 16.6181640625, 17.1875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 10.0, 6.0, 6.0, 11.0, 12.0, 15.0, 17.0, 32.0, 25.0, 28.0, 40.0, 59.0, 77.0, 87.0, 113.0, 78.0, 74.0, 58.0, 57.0, 34.0, 18.0, 20.0, 17.0, 13.0, 11.0, 9.0, 11.0, 5.0, 7.0, 9.0, 3.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.6197509765625, -9.270751953125, -8.9217529296875, -8.57275390625, -8.2237548828125, -7.874755859375, -7.5257568359375, -7.1767578125, -6.8277587890625, -6.478759765625, -6.1297607421875, -5.78076171875, -5.4317626953125, -5.082763671875, -4.7337646484375, -4.384765625, -4.0357666015625, -3.686767578125, -3.3377685546875, -2.98876953125, -2.6397705078125, -2.290771484375, -1.9417724609375, -1.5927734375, -1.2437744140625, -0.894775390625, -0.5457763671875, -0.19677734375, 0.1522216796875, 0.501220703125, 0.8502197265625, 1.19921875, 1.5482177734375, 1.897216796875, 2.2462158203125, 2.59521484375, 2.9442138671875, 3.293212890625, 3.6422119140625, 3.9912109375, 4.3402099609375, 4.689208984375, 5.0382080078125, 5.38720703125, 5.7362060546875, 6.085205078125, 6.4342041015625, 6.783203125, 7.1322021484375, 7.481201171875, 7.8302001953125, 8.17919921875, 8.5281982421875, 8.877197265625, 9.2261962890625, 9.5751953125, 9.9241943359375, 10.273193359375, 10.6221923828125, 10.97119140625, 11.3201904296875, 11.669189453125, 12.0181884765625, 12.3671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 12.0, 17.0, 33.0, 37.0, 45.0, 78.0, 97.0, 111.0, 133.0, 108.0, 87.0, 75.0, 58.0, 31.0, 26.0, 21.0, 6.0, 2.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.860107421875, -131.72422790527344, -126.58834838867188, -121.45246887207031, -116.31658935546875, -111.18070983886719, -106.04483032226562, -100.90895080566406, -95.7730712890625, -90.63719177246094, -85.50131225585938, -80.36543273925781, -75.22955322265625, -70.09367370605469, -64.95779418945312, -59.82191467285156, -54.68603515625, -49.55015563964844, -44.414276123046875, -39.27839660644531, -34.14251708984375, -29.006637573242188, -23.870758056640625, -18.734878540039062, -13.5989990234375, -8.463119506835938, -3.327239990234375, 1.8086395263671875, 6.94451904296875, 12.080398559570312, 17.216278076171875, 22.352157592773438, 27.488037109375, 32.62391662597656, 37.759796142578125, 42.89567565917969, 48.03155517578125, 53.16743469238281, 58.303314208984375, 63.43919372558594, 68.5750732421875, 73.71095275878906, 78.84683227539062, 83.98271179199219, 89.11859130859375, 94.25447082519531, 99.39035034179688, 104.52622985839844, 109.662109375, 114.79798889160156, 119.93386840820312, 125.06974792480469, 130.20562744140625, 135.3415069580078, 140.47738647460938, 145.61326599121094, 150.7491455078125, 155.88502502441406, 161.02090454101562, 166.1567840576172, 171.29266357421875, 176.4285430908203, 181.56442260742188, 186.70030212402344, 191.836181640625]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 8.0, 5.0, 9.0, 7.0, 17.0, 14.0, 11.0, 19.0, 22.0, 16.0, 25.0, 22.0, 32.0, 34.0, 29.0, 31.0, 35.0, 37.0, 33.0, 43.0, 55.0, 43.0, 36.0, 42.0, 30.0, 33.0, 26.0, 41.0, 35.0, 41.0, 21.0, 20.0, 19.0, 19.0, 23.0, 15.0, 7.0, 8.0, 7.0, 7.0, 2.0, 9.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-95.60684967041016, -92.68412017822266, -89.76139068603516, -86.83865356445312, -83.91592407226562, -80.99319458007812, -78.07046508789062, -75.14773559570312, -72.22500610351562, -69.30227661132812, -66.37954711914062, -63.45681381225586, -60.53408432006836, -57.611351013183594, -54.688621520996094, -51.765892028808594, -48.84315872192383, -45.92042922973633, -42.99769592285156, -40.07496643066406, -37.15223693847656, -34.22950744628906, -31.306774139404297, -28.384044647216797, -25.461313247680664, -22.53858184814453, -19.61585235595703, -16.6931209564209, -13.770390510559082, -10.847660064697266, -7.924928665161133, -5.002199172973633, -2.0794677734375, 0.8432629108428955, 3.765993595123291, 6.688724517822266, 9.611454963684082, 12.534185409545898, 15.456916809082031, 18.37964630126953, 21.302377700805664, 24.225109100341797, 27.147838592529297, 30.07056999206543, 32.99330139160156, 35.91603088378906, 38.83876037597656, 41.76148986816406, 44.68422317504883, 47.60695266723633, 50.529685974121094, 53.452415466308594, 56.375144958496094, 59.297874450683594, 62.22060775756836, 65.14334106445312, 68.06607055664062, 70.98880004882812, 73.91152954101562, 76.83425903320312, 79.75699615478516, 82.67972564697266, 85.60245513916016, 88.52518463134766, 91.44791412353516]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 7.0, 12.0, 25.0, 22.0, 49.0, 97.0, 151.0, 263.0, 463.0, 850.0, 1923.0, 4241.0, 9888.0, 26133.0, 80999.0, 364395.0, 3272353.0, 318958.0, 73323.0, 23745.0, 8847.0, 3751.0, 1735.0, 911.0, 447.0, 284.0, 154.0, 89.0, 58.0, 35.0, 20.0, 17.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.765625, -23.01025390625, -22.2548828125, -21.49951171875, -20.744140625, -19.98876953125, -19.2333984375, -18.47802734375, -17.72265625, -16.96728515625, -16.2119140625, -15.45654296875, -14.701171875, -13.94580078125, -13.1904296875, -12.43505859375, -11.6796875, -10.92431640625, -10.1689453125, -9.41357421875, -8.658203125, -7.90283203125, -7.1474609375, -6.39208984375, -5.63671875, -4.88134765625, -4.1259765625, -3.37060546875, -2.615234375, -1.85986328125, -1.1044921875, -0.34912109375, 0.40625, 1.16162109375, 1.9169921875, 2.67236328125, 3.427734375, 4.18310546875, 4.9384765625, 5.69384765625, 6.44921875, 7.20458984375, 7.9599609375, 8.71533203125, 9.470703125, 10.22607421875, 10.9814453125, 11.73681640625, 12.4921875, 13.24755859375, 14.0029296875, 14.75830078125, 15.513671875, 16.26904296875, 17.0244140625, 17.77978515625, 18.53515625, 19.29052734375, 20.0458984375, 20.80126953125, 21.556640625, 22.31201171875, 23.0673828125, 23.82275390625, 24.578125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 5.0, 12.0, 15.0, 12.0, 12.0, 10.0, 23.0, 22.0, 37.0, 34.0, 33.0, 39.0, 31.0, 49.0, 46.0, 58.0, 54.0, 38.0, 47.0, 62.0, 47.0, 30.0, 42.0, 38.0, 33.0, 19.0, 32.0, 19.0, 20.0, 12.0, 11.0, 7.0, 9.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.798828125, -2.715789794921875, -2.63275146484375, -2.549713134765625, -2.4666748046875, -2.383636474609375, -2.30059814453125, -2.217559814453125, -2.134521484375, -2.051483154296875, -1.96844482421875, -1.885406494140625, -1.8023681640625, -1.719329833984375, -1.63629150390625, -1.553253173828125, -1.47021484375, -1.387176513671875, -1.30413818359375, -1.221099853515625, -1.1380615234375, -1.055023193359375, -0.97198486328125, -0.888946533203125, -0.805908203125, -0.722869873046875, -0.63983154296875, -0.556793212890625, -0.4737548828125, -0.390716552734375, -0.30767822265625, -0.224639892578125, -0.1416015625, -0.058563232421875, 0.02447509765625, 0.107513427734375, 0.1905517578125, 0.273590087890625, 0.35662841796875, 0.439666748046875, 0.522705078125, 0.605743408203125, 0.68878173828125, 0.771820068359375, 0.8548583984375, 0.937896728515625, 1.02093505859375, 1.103973388671875, 1.18701171875, 1.270050048828125, 1.35308837890625, 1.436126708984375, 1.5191650390625, 1.602203369140625, 1.68524169921875, 1.768280029296875, 1.851318359375, 1.934356689453125, 2.01739501953125, 2.100433349609375, 2.1834716796875, 2.266510009765625, 2.34954833984375, 2.432586669921875, 2.515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 5.0, 8.0, 16.0, 26.0, 33.0, 64.0, 120.0, 202.0, 345.0, 606.0, 1142.0, 2338.0, 5297.0, 13828.0, 44103.0, 183018.0, 2264404.0, 1454759.0, 161164.0, 40048.0, 12981.0, 5073.0, 2276.0, 1125.0, 517.0, 311.0, 178.0, 112.0, 66.0, 39.0, 26.0, 16.0, 12.0, 10.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53125, -22.625, -21.71875, -20.8125, -19.90625, -19.0, -18.09375, -17.1875, -16.28125, -15.375, -14.46875, -13.5625, -12.65625, -11.75, -10.84375, -9.9375, -9.03125, -8.125, -7.21875, -6.3125, -5.40625, -4.5, -3.59375, -2.6875, -1.78125, -0.875, 0.03125, 0.9375, 1.84375, 2.75, 3.65625, 4.5625, 5.46875, 6.375, 7.28125, 8.1875, 9.09375, 10.0, 10.90625, 11.8125, 12.71875, 13.625, 14.53125, 15.4375, 16.34375, 17.25, 18.15625, 19.0625, 19.96875, 20.875, 21.78125, 22.6875, 23.59375, 24.5, 25.40625, 26.3125, 27.21875, 28.125, 29.03125, 29.9375, 30.84375, 31.75, 32.65625, 33.5625, 34.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 12.0, 9.0, 14.0, 16.0, 23.0, 24.0, 41.0, 48.0, 68.0, 97.0, 123.0, 224.0, 306.0, 715.0, 1247.0, 380.0, 205.0, 148.0, 84.0, 72.0, 44.0, 51.0, 24.0, 18.0, 20.0, 9.0, 7.0, 4.0, 7.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.109375, -6.90130615234375, -6.6932373046875, -6.48516845703125, -6.277099609375, -6.06903076171875, -5.8609619140625, -5.65289306640625, -5.44482421875, -5.23675537109375, -5.0286865234375, -4.82061767578125, -4.612548828125, -4.40447998046875, -4.1964111328125, -3.98834228515625, -3.7802734375, -3.57220458984375, -3.3641357421875, -3.15606689453125, -2.947998046875, -2.73992919921875, -2.5318603515625, -2.32379150390625, -2.11572265625, -1.90765380859375, -1.6995849609375, -1.49151611328125, -1.283447265625, -1.07537841796875, -0.8673095703125, -0.65924072265625, -0.451171875, -0.24310302734375, -0.0350341796875, 0.17303466796875, 0.381103515625, 0.58917236328125, 0.7972412109375, 1.00531005859375, 1.21337890625, 1.42144775390625, 1.6295166015625, 1.83758544921875, 2.045654296875, 2.25372314453125, 2.4617919921875, 2.66986083984375, 2.8779296875, 3.08599853515625, 3.2940673828125, 3.50213623046875, 3.710205078125, 3.91827392578125, 4.1263427734375, 4.33441162109375, 4.54248046875, 4.75054931640625, 4.9586181640625, 5.16668701171875, 5.374755859375, 5.58282470703125, 5.7908935546875, 5.99896240234375, 6.20703125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 14.0, 21.0, 64.0, 74.0, 157.0, 177.0, 171.0, 135.0, 93.0, 51.0, 22.0, 13.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.34422302246094, -124.75031280517578, -122.15640258789062, -119.5625, -116.96858978271484, -114.37467956542969, -111.78076934814453, -109.18685913085938, -106.59294891357422, -103.99903869628906, -101.4051284790039, -98.81121826171875, -96.21731567382812, -93.62340545654297, -91.02949523925781, -88.43558502197266, -85.8416748046875, -83.24776458740234, -80.65385437011719, -78.05995178222656, -75.4660415649414, -72.87213134765625, -70.2782211303711, -67.68431091308594, -65.09040832519531, -62.496498107910156, -59.902591705322266, -57.30868148803711, -54.71477127075195, -52.12086486816406, -49.526954650878906, -46.93304443359375, -44.339134216308594, -41.74522399902344, -39.15131759643555, -36.55740737915039, -33.963497161865234, -31.36958885192871, -28.775680541992188, -26.18177032470703, -23.587862014770508, -20.993953704833984, -18.400043487548828, -15.806135177612305, -13.212225914001465, -10.618316650390625, -8.024408340454102, -5.430498123168945, -2.836589813232422, -0.24268078804016113, 2.3512282371520996, 4.945137023925781, 7.539046287536621, 10.132955551147461, 12.726863861083984, 15.32077407836914, 17.914682388305664, 20.508590698242188, 23.102500915527344, 25.696409225463867, 28.29031753540039, 30.884227752685547, 33.47813415527344, 36.072044372558594, 38.66595458984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 1.0, 9.0, 10.0, 9.0, 16.0, 19.0, 23.0, 22.0, 28.0, 34.0, 25.0, 29.0, 30.0, 38.0, 47.0, 47.0, 41.0, 43.0, 64.0, 39.0, 37.0, 42.0, 50.0, 31.0, 29.0, 34.0, 32.0, 32.0, 23.0, 16.0, 15.0, 18.0, 13.0, 11.0, 7.0, 16.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.120281219482422, -22.178024291992188, -21.235767364501953, -20.29351043701172, -19.35125160217285, -18.408994674682617, -17.466737747192383, -16.52448081970215, -15.582223892211914, -14.63996696472168, -13.697709083557129, -12.755452156066895, -11.81319522857666, -10.87093734741211, -9.928680419921875, -8.98642349243164, -8.04416561126709, -7.101908206939697, -6.159651279449463, -5.21739387512207, -4.275136947631836, -3.3328795433044434, -2.390622138977051, -1.4483652114868164, -0.5061078071594238, 0.4361494183540344, 1.3784066438674927, 2.3206639289855957, 3.262921094894409, 4.205178260803223, 5.147435665130615, 6.08969259262085, 7.031949996948242, 7.974207401275635, 8.916464805603027, 9.858721733093262, 10.800978660583496, 11.743236541748047, 12.685493469238281, 13.627750396728516, 14.57000732421875, 15.512264251708984, 16.45452117919922, 17.396778106689453, 18.33903694152832, 19.281293869018555, 20.22355079650879, 21.165807723999023, 22.10806655883789, 23.050323486328125, 23.99258041381836, 24.934837341308594, 25.87709617614746, 26.819353103637695, 27.76161003112793, 28.703866958618164, 29.6461238861084, 30.588380813598633, 31.530637741088867, 32.472896575927734, 33.41515350341797, 34.3574104309082, 35.29966735839844, 36.24192428588867, 37.184181213378906]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 12.0, 18.0, 21.0, 43.0, 41.0, 86.0, 169.0, 248.0, 448.0, 877.0, 1735.0, 3563.0, 7146.0, 15399.0, 33799.0, 76562.0, 165531.0, 296265.0, 237140.0, 113610.0, 51549.0, 23330.0, 10753.0, 4995.0, 2476.0, 1222.0, 616.0, 337.0, 220.0, 131.0, 74.0, 40.0, 29.0, 13.0, 22.0, 13.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.5625, -17.084716796875, -16.60693359375, -16.129150390625, -15.6513671875, -15.173583984375, -14.69580078125, -14.218017578125, -13.740234375, -13.262451171875, -12.78466796875, -12.306884765625, -11.8291015625, -11.351318359375, -10.87353515625, -10.395751953125, -9.91796875, -9.440185546875, -8.96240234375, -8.484619140625, -8.0068359375, -7.529052734375, -7.05126953125, -6.573486328125, -6.095703125, -5.617919921875, -5.14013671875, -4.662353515625, -4.1845703125, -3.706787109375, -3.22900390625, -2.751220703125, -2.2734375, -1.795654296875, -1.31787109375, -0.840087890625, -0.3623046875, 0.115478515625, 0.59326171875, 1.071044921875, 1.548828125, 2.026611328125, 2.50439453125, 2.982177734375, 3.4599609375, 3.937744140625, 4.41552734375, 4.893310546875, 5.37109375, 5.848876953125, 6.32666015625, 6.804443359375, 7.2822265625, 7.760009765625, 8.23779296875, 8.715576171875, 9.193359375, 9.671142578125, 10.14892578125, 10.626708984375, 11.1044921875, 11.582275390625, 12.06005859375, 12.537841796875, 13.015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 10.0, 7.0, 9.0, 10.0, 17.0, 12.0, 19.0, 20.0, 28.0, 36.0, 30.0, 27.0, 33.0, 40.0, 48.0, 48.0, 52.0, 59.0, 37.0, 47.0, 42.0, 50.0, 42.0, 36.0, 37.0, 26.0, 32.0, 24.0, 16.0, 20.0, 13.0, 13.0, 12.0, 5.0, 11.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.962890625, -2.877197265625, -2.79150390625, -2.705810546875, -2.6201171875, -2.534423828125, -2.44873046875, -2.363037109375, -2.27734375, -2.191650390625, -2.10595703125, -2.020263671875, -1.9345703125, -1.848876953125, -1.76318359375, -1.677490234375, -1.591796875, -1.506103515625, -1.42041015625, -1.334716796875, -1.2490234375, -1.163330078125, -1.07763671875, -0.991943359375, -0.90625, -0.820556640625, -0.73486328125, -0.649169921875, -0.5634765625, -0.477783203125, -0.39208984375, -0.306396484375, -0.220703125, -0.135009765625, -0.04931640625, 0.036376953125, 0.1220703125, 0.207763671875, 0.29345703125, 0.379150390625, 0.46484375, 0.550537109375, 0.63623046875, 0.721923828125, 0.8076171875, 0.893310546875, 0.97900390625, 1.064697265625, 1.150390625, 1.236083984375, 1.32177734375, 1.407470703125, 1.4931640625, 1.578857421875, 1.66455078125, 1.750244140625, 1.8359375, 1.921630859375, 2.00732421875, 2.093017578125, 2.1787109375, 2.264404296875, 2.35009765625, 2.435791015625, 2.521484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 10.0, 10.0, 14.0, 20.0, 29.0, 42.0, 62.0, 94.0, 132.0, 217.0, 338.0, 555.0, 937.0, 1865.0, 3849.0, 8429.0, 21329.0, 57799.0, 156989.0, 356890.0, 271224.0, 103642.0, 37470.0, 14315.0, 6072.0, 2796.0, 1406.0, 788.0, 443.0, 249.0, 173.0, 95.0, 84.0, 50.0, 46.0, 19.0, 25.0, 9.0, 11.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.640625, -20.02978515625, -19.4189453125, -18.80810546875, -18.197265625, -17.58642578125, -16.9755859375, -16.36474609375, -15.75390625, -15.14306640625, -14.5322265625, -13.92138671875, -13.310546875, -12.69970703125, -12.0888671875, -11.47802734375, -10.8671875, -10.25634765625, -9.6455078125, -9.03466796875, -8.423828125, -7.81298828125, -7.2021484375, -6.59130859375, -5.98046875, -5.36962890625, -4.7587890625, -4.14794921875, -3.537109375, -2.92626953125, -2.3154296875, -1.70458984375, -1.09375, -0.48291015625, 0.1279296875, 0.73876953125, 1.349609375, 1.96044921875, 2.5712890625, 3.18212890625, 3.79296875, 4.40380859375, 5.0146484375, 5.62548828125, 6.236328125, 6.84716796875, 7.4580078125, 8.06884765625, 8.6796875, 9.29052734375, 9.9013671875, 10.51220703125, 11.123046875, 11.73388671875, 12.3447265625, 12.95556640625, 13.56640625, 14.17724609375, 14.7880859375, 15.39892578125, 16.009765625, 16.62060546875, 17.2314453125, 17.84228515625, 18.453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 6.0, 10.0, 12.0, 13.0, 13.0, 20.0, 26.0, 22.0, 35.0, 24.0, 40.0, 41.0, 39.0, 55.0, 48.0, 44.0, 45.0, 46.0, 38.0, 56.0, 44.0, 48.0, 37.0, 33.0, 32.0, 29.0, 23.0, 20.0, 16.0, 10.0, 10.0, 7.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.375, -16.8536376953125, -16.332275390625, -15.8109130859375, -15.28955078125, -14.7681884765625, -14.246826171875, -13.7254638671875, -13.2041015625, -12.6827392578125, -12.161376953125, -11.6400146484375, -11.11865234375, -10.5972900390625, -10.075927734375, -9.5545654296875, -9.033203125, -8.5118408203125, -7.990478515625, -7.4691162109375, -6.94775390625, -6.4263916015625, -5.905029296875, -5.3836669921875, -4.8623046875, -4.3409423828125, -3.819580078125, -3.2982177734375, -2.77685546875, -2.2554931640625, -1.734130859375, -1.2127685546875, -0.69140625, -0.1700439453125, 0.351318359375, 0.8726806640625, 1.39404296875, 1.9154052734375, 2.436767578125, 2.9581298828125, 3.4794921875, 4.0008544921875, 4.522216796875, 5.0435791015625, 5.56494140625, 6.0863037109375, 6.607666015625, 7.1290283203125, 7.650390625, 8.1717529296875, 8.693115234375, 9.2144775390625, 9.73583984375, 10.2572021484375, 10.778564453125, 11.2999267578125, 11.8212890625, 12.3426513671875, 12.864013671875, 13.3853759765625, 13.90673828125, 14.4281005859375, 14.949462890625, 15.4708251953125, 15.9921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 19.0, 32.0, 31.0, 65.0, 70.0, 109.0, 194.0, 340.0, 624.0, 1255.0, 2595.0, 6423.0, 16487.0, 50088.0, 171337.0, 433786.0, 253564.0, 72920.0, 23358.0, 8468.0, 3366.0, 1535.0, 787.0, 427.0, 254.0, 128.0, 90.0, 54.0, 42.0, 27.0, 18.0, 9.0, 13.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6484375, -9.333740234375, -9.01904296875, -8.704345703125, -8.3896484375, -8.074951171875, -7.76025390625, -7.445556640625, -7.130859375, -6.816162109375, -6.50146484375, -6.186767578125, -5.8720703125, -5.557373046875, -5.24267578125, -4.927978515625, -4.61328125, -4.298583984375, -3.98388671875, -3.669189453125, -3.3544921875, -3.039794921875, -2.72509765625, -2.410400390625, -2.095703125, -1.781005859375, -1.46630859375, -1.151611328125, -0.8369140625, -0.522216796875, -0.20751953125, 0.107177734375, 0.421875, 0.736572265625, 1.05126953125, 1.365966796875, 1.6806640625, 1.995361328125, 2.31005859375, 2.624755859375, 2.939453125, 3.254150390625, 3.56884765625, 3.883544921875, 4.1982421875, 4.512939453125, 4.82763671875, 5.142333984375, 5.45703125, 5.771728515625, 6.08642578125, 6.401123046875, 6.7158203125, 7.030517578125, 7.34521484375, 7.659912109375, 7.974609375, 8.289306640625, 8.60400390625, 8.918701171875, 9.2333984375, 9.548095703125, 9.86279296875, 10.177490234375, 10.4921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 0.0, 3.0, 5.0, 5.0, 8.0, 6.0, 16.0, 15.0, 17.0, 23.0, 22.0, 35.0, 55.0, 47.0, 72.0, 105.0, 113.0, 106.0, 75.0, 57.0, 35.0, 37.0, 30.0, 28.0, 17.0, 11.0, 19.0, 11.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0018749237060546875, -0.001817077398300171, -0.0017592310905456543, -0.0017013847827911377, -0.001643538475036621, -0.0015856921672821045, -0.0015278458595275879, -0.0014699995517730713, -0.0014121532440185547, -0.001354306936264038, -0.0012964606285095215, -0.0012386143207550049, -0.0011807680130004883, -0.0011229217052459717, -0.001065075397491455, -0.0010072290897369385, -0.0009493827819824219, -0.0008915364742279053, -0.0008336901664733887, -0.0007758438587188721, -0.0007179975509643555, -0.0006601512432098389, -0.0006023049354553223, -0.0005444586277008057, -0.00048661231994628906, -0.00042876601219177246, -0.00037091970443725586, -0.00031307339668273926, -0.00025522708892822266, -0.00019738078117370605, -0.00013953447341918945, -8.168816566467285e-05, -2.384185791015625e-05, 3.400444984436035e-05, 9.185075759887695e-05, 0.00014969706535339355, 0.00020754337310791016, 0.00026538968086242676, 0.00032323598861694336, 0.00038108229637145996, 0.00043892860412597656, 0.0004967749118804932, 0.0005546212196350098, 0.0006124675273895264, 0.000670313835144043, 0.0007281601428985596, 0.0007860064506530762, 0.0008438527584075928, 0.0009016990661621094, 0.000959545373916626, 0.0010173916816711426, 0.0010752379894256592, 0.0011330842971801758, 0.0011909306049346924, 0.001248776912689209, 0.0013066232204437256, 0.0013644695281982422, 0.0014223158359527588, 0.0014801621437072754, 0.001538008451461792, 0.0015958547592163086, 0.0016537010669708252, 0.0017115473747253418, 0.0017693936824798584, 0.001827239990234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 9.0, 31.0, 30.0, 38.0, 48.0, 83.0, 105.0, 181.0, 292.0, 500.0, 834.0, 1727.0, 3463.0, 7993.0, 19435.0, 54214.0, 177292.0, 439013.0, 231809.0, 69406.0, 23779.0, 9611.0, 4200.0, 2007.0, 1010.0, 506.0, 305.0, 201.0, 122.0, 83.0, 56.0, 43.0, 35.0, 25.0, 9.0, 14.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.9296875, -8.6175537109375, -8.305419921875, -7.9932861328125, -7.68115234375, -7.3690185546875, -7.056884765625, -6.7447509765625, -6.4326171875, -6.1204833984375, -5.808349609375, -5.4962158203125, -5.18408203125, -4.8719482421875, -4.559814453125, -4.2476806640625, -3.935546875, -3.6234130859375, -3.311279296875, -2.9991455078125, -2.68701171875, -2.3748779296875, -2.062744140625, -1.7506103515625, -1.4384765625, -1.1263427734375, -0.814208984375, -0.5020751953125, -0.18994140625, 0.1221923828125, 0.434326171875, 0.7464599609375, 1.05859375, 1.3707275390625, 1.682861328125, 1.9949951171875, 2.30712890625, 2.6192626953125, 2.931396484375, 3.2435302734375, 3.5556640625, 3.8677978515625, 4.179931640625, 4.4920654296875, 4.80419921875, 5.1163330078125, 5.428466796875, 5.7406005859375, 6.052734375, 6.3648681640625, 6.677001953125, 6.9891357421875, 7.30126953125, 7.6134033203125, 7.925537109375, 8.2376708984375, 8.5498046875, 8.8619384765625, 9.174072265625, 9.4862060546875, 9.79833984375, 10.1104736328125, 10.422607421875, 10.7347412109375, 11.046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 2.0, 6.0, 10.0, 9.0, 12.0, 9.0, 24.0, 24.0, 25.0, 29.0, 38.0, 51.0, 62.0, 75.0, 81.0, 89.0, 77.0, 59.0, 68.0, 57.0, 43.0, 31.0, 28.0, 17.0, 17.0, 8.0, 8.0, 6.0, 5.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.27423095703125, -9.0328369140625, -8.79144287109375, -8.550048828125, -8.30865478515625, -8.0672607421875, -7.82586669921875, -7.58447265625, -7.34307861328125, -7.1016845703125, -6.86029052734375, -6.618896484375, -6.37750244140625, -6.1361083984375, -5.89471435546875, -5.6533203125, -5.41192626953125, -5.1705322265625, -4.92913818359375, -4.687744140625, -4.44635009765625, -4.2049560546875, -3.96356201171875, -3.72216796875, -3.48077392578125, -3.2393798828125, -2.99798583984375, -2.756591796875, -2.51519775390625, -2.2738037109375, -2.03240966796875, -1.791015625, -1.54962158203125, -1.3082275390625, -1.06683349609375, -0.825439453125, -0.58404541015625, -0.3426513671875, -0.10125732421875, 0.14013671875, 0.38153076171875, 0.6229248046875, 0.86431884765625, 1.105712890625, 1.34710693359375, 1.5885009765625, 1.82989501953125, 2.0712890625, 2.31268310546875, 2.5540771484375, 2.79547119140625, 3.036865234375, 3.27825927734375, 3.5196533203125, 3.76104736328125, 4.00244140625, 4.24383544921875, 4.4852294921875, 4.72662353515625, 4.968017578125, 5.20941162109375, 5.4508056640625, 5.69219970703125, 5.93359375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 13.0, 21.0, 30.0, 49.0, 63.0, 87.0, 113.0, 138.0, 127.0, 104.0, 81.0, 50.0, 43.0, 25.0, 19.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.12112426757812, -109.714111328125, -105.30709838867188, -100.90008544921875, -96.49308013916016, -92.08606719970703, -87.6790542602539, -83.27204132080078, -78.86503601074219, -74.45802307128906, -70.05101013183594, -65.64399719238281, -61.23699188232422, -56.829978942871094, -52.42296600341797, -48.015953063964844, -43.60894012451172, -39.201927185058594, -34.794918060302734, -30.38790512084961, -25.980894088745117, -21.573883056640625, -17.1668701171875, -12.759859085083008, -8.352848052978516, -3.9458365440368652, 0.46117496490478516, 4.868186950683594, 9.275197982788086, 13.682209014892578, 18.089221954345703, 22.496232986450195, 26.903244018554688, 31.31025505065918, 35.71726608276367, 40.1242790222168, 44.531288146972656, 48.93830108642578, 53.345314025878906, 57.75232696533203, 62.15933609008789, 66.56634521484375, 70.97335815429688, 75.38037109375, 79.78738403320312, 84.19439697265625, 88.60140991210938, 93.00841522216797, 97.4154281616211, 101.82244110107422, 106.22945404052734, 110.63645935058594, 115.04347229003906, 119.45048522949219, 123.85749816894531, 128.26451110839844, 132.67152404785156, 137.0785369873047, 141.4855499267578, 145.89256286621094, 150.29957580566406, 154.70657348632812, 159.11358642578125, 163.52059936523438, 167.9276123046875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 5.0, 11.0, 17.0, 10.0, 15.0, 15.0, 17.0, 30.0, 33.0, 40.0, 38.0, 45.0, 54.0, 44.0, 41.0, 44.0, 60.0, 53.0, 51.0, 44.0, 51.0, 43.0, 43.0, 36.0, 27.0, 25.0, 13.0, 18.0, 13.0, 10.0, 10.0, 13.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-116.56708526611328, -113.34964752197266, -110.1322021484375, -106.91476440429688, -103.69732666015625, -100.4798812866211, -97.26244354248047, -94.04499816894531, -90.82756042480469, -87.61012268066406, -84.3926773071289, -81.17523956298828, -77.95779418945312, -74.7403564453125, -71.52291870117188, -68.30548095703125, -65.0880355834961, -61.8705940246582, -58.65315246582031, -55.43571472167969, -52.2182731628418, -49.000831604003906, -45.78339385986328, -42.56595230102539, -39.3485107421875, -36.13106918334961, -32.91362762451172, -29.696189880371094, -26.478748321533203, -23.261306762695312, -20.043867111206055, -16.826427459716797, -13.608978271484375, -10.3915376663208, -7.174097061157227, -3.9566564559936523, -0.7392158508300781, 2.4782257080078125, 5.69566535949707, 8.913105010986328, 12.130546569824219, 15.347987174987793, 18.565427780151367, 21.782867431640625, 25.000308990478516, 28.217750549316406, 31.435190200805664, 34.65262985229492, 37.87007141113281, 41.0875129699707, 44.304954528808594, 47.52239227294922, 50.73983383178711, 53.957275390625, 57.174713134765625, 60.392154693603516, 63.609596252441406, 66.82703399658203, 70.04447937011719, 73.26191711425781, 76.47935485839844, 79.6968002319336, 82.91423797607422, 86.13168334960938, 89.34912109375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 7.0, 8.0, 18.0, 21.0, 40.0, 58.0, 81.0, 138.0, 260.0, 427.0, 672.0, 1216.0, 2315.0, 4706.0, 10185.0, 24422.0, 70483.0, 314369.0, 3382206.0, 276153.0, 65190.0, 22602.0, 9239.0, 4501.0, 2078.0, 1182.0, 638.0, 390.0, 233.0, 152.0, 101.0, 60.0, 33.0, 29.0, 24.0, 15.0, 10.0, 4.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.890625, -17.2392578125, -16.587890625, -15.9365234375, -15.28515625, -14.6337890625, -13.982421875, -13.3310546875, -12.6796875, -12.0283203125, -11.376953125, -10.7255859375, -10.07421875, -9.4228515625, -8.771484375, -8.1201171875, -7.46875, -6.8173828125, -6.166015625, -5.5146484375, -4.86328125, -4.2119140625, -3.560546875, -2.9091796875, -2.2578125, -1.6064453125, -0.955078125, -0.3037109375, 0.34765625, 0.9990234375, 1.650390625, 2.3017578125, 2.953125, 3.6044921875, 4.255859375, 4.9072265625, 5.55859375, 6.2099609375, 6.861328125, 7.5126953125, 8.1640625, 8.8154296875, 9.466796875, 10.1181640625, 10.76953125, 11.4208984375, 12.072265625, 12.7236328125, 13.375, 14.0263671875, 14.677734375, 15.3291015625, 15.98046875, 16.6318359375, 17.283203125, 17.9345703125, 18.5859375, 19.2373046875, 19.888671875, 20.5400390625, 21.19140625, 21.8427734375, 22.494140625, 23.1455078125, 23.796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 3.0, 11.0, 4.0, 12.0, 11.0, 9.0, 18.0, 20.0, 25.0, 27.0, 24.0, 27.0, 46.0, 29.0, 39.0, 43.0, 37.0, 60.0, 56.0, 51.0, 55.0, 38.0, 43.0, 40.0, 36.0, 33.0, 32.0, 25.0, 29.0, 21.0, 15.0, 6.0, 12.0, 15.0, 11.0, 7.0, 10.0, 6.0, 4.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.21484375, -3.1253662109375, -3.035888671875, -2.9464111328125, -2.85693359375, -2.7674560546875, -2.677978515625, -2.5885009765625, -2.4990234375, -2.4095458984375, -2.320068359375, -2.2305908203125, -2.14111328125, -2.0516357421875, -1.962158203125, -1.8726806640625, -1.783203125, -1.6937255859375, -1.604248046875, -1.5147705078125, -1.42529296875, -1.3358154296875, -1.246337890625, -1.1568603515625, -1.0673828125, -0.9779052734375, -0.888427734375, -0.7989501953125, -0.70947265625, -0.6199951171875, -0.530517578125, -0.4410400390625, -0.3515625, -0.2620849609375, -0.172607421875, -0.0831298828125, 0.00634765625, 0.0958251953125, 0.185302734375, 0.2747802734375, 0.3642578125, 0.4537353515625, 0.543212890625, 0.6326904296875, 0.72216796875, 0.8116455078125, 0.901123046875, 0.9906005859375, 1.080078125, 1.1695556640625, 1.259033203125, 1.3485107421875, 1.43798828125, 1.5274658203125, 1.616943359375, 1.7064208984375, 1.7958984375, 1.8853759765625, 1.974853515625, 2.0643310546875, 2.15380859375, 2.2432861328125, 2.332763671875, 2.4222412109375, 2.51171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 18.0, 26.0, 51.0, 78.0, 107.0, 172.0, 307.0, 528.0, 1022.0, 1752.0, 3497.0, 7677.0, 19279.0, 54618.0, 202193.0, 2701593.0, 991022.0, 142108.0, 41154.0, 14732.0, 6095.0, 2816.0, 1412.0, 832.0, 432.0, 293.0, 160.0, 99.0, 65.0, 40.0, 30.0, 18.0, 15.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.399658203125, -21.67431640625, -20.948974609375, -20.2236328125, -19.498291015625, -18.77294921875, -18.047607421875, -17.322265625, -16.596923828125, -15.87158203125, -15.146240234375, -14.4208984375, -13.695556640625, -12.97021484375, -12.244873046875, -11.51953125, -10.794189453125, -10.06884765625, -9.343505859375, -8.6181640625, -7.892822265625, -7.16748046875, -6.442138671875, -5.716796875, -4.991455078125, -4.26611328125, -3.540771484375, -2.8154296875, -2.090087890625, -1.36474609375, -0.639404296875, 0.0859375, 0.811279296875, 1.53662109375, 2.261962890625, 2.9873046875, 3.712646484375, 4.43798828125, 5.163330078125, 5.888671875, 6.614013671875, 7.33935546875, 8.064697265625, 8.7900390625, 9.515380859375, 10.24072265625, 10.966064453125, 11.69140625, 12.416748046875, 13.14208984375, 13.867431640625, 14.5927734375, 15.318115234375, 16.04345703125, 16.768798828125, 17.494140625, 18.219482421875, 18.94482421875, 19.670166015625, 20.3955078125, 21.120849609375, 21.84619140625, 22.571533203125, 23.296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 5.0, 7.0, 18.0, 28.0, 16.0, 30.0, 41.0, 59.0, 85.0, 114.0, 203.0, 379.0, 1385.0, 849.0, 293.0, 173.0, 111.0, 57.0, 56.0, 38.0, 32.0, 17.0, 16.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.80859375, -6.5882568359375, -6.367919921875, -6.1475830078125, -5.92724609375, -5.7069091796875, -5.486572265625, -5.2662353515625, -5.0458984375, -4.8255615234375, -4.605224609375, -4.3848876953125, -4.16455078125, -3.9442138671875, -3.723876953125, -3.5035400390625, -3.283203125, -3.0628662109375, -2.842529296875, -2.6221923828125, -2.40185546875, -2.1815185546875, -1.961181640625, -1.7408447265625, -1.5205078125, -1.3001708984375, -1.079833984375, -0.8594970703125, -0.63916015625, -0.4188232421875, -0.198486328125, 0.0218505859375, 0.2421875, 0.4625244140625, 0.682861328125, 0.9031982421875, 1.12353515625, 1.3438720703125, 1.564208984375, 1.7845458984375, 2.0048828125, 2.2252197265625, 2.445556640625, 2.6658935546875, 2.88623046875, 3.1065673828125, 3.326904296875, 3.5472412109375, 3.767578125, 3.9879150390625, 4.208251953125, 4.4285888671875, 4.64892578125, 4.8692626953125, 5.089599609375, 5.3099365234375, 5.5302734375, 5.7506103515625, 5.970947265625, 6.1912841796875, 6.41162109375, 6.6319580078125, 6.852294921875, 7.0726318359375, 7.29296875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 11.0, 23.0, 41.0, 84.0, 179.0, 198.0, 209.0, 130.0, 59.0, 32.0, 24.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.11735916137695, -38.554901123046875, -35.9924430847168, -33.42998504638672, -30.867528915405273, -28.305070877075195, -25.74261474609375, -23.180156707763672, -20.617698669433594, -18.055240631103516, -15.492783546447754, -12.930326461791992, -10.367868423461914, -7.805410385131836, -5.242953300476074, -2.6804962158203125, -0.11803817749023438, 2.4444193840026855, 5.0068769454956055, 7.569334506988525, 10.131792068481445, 12.694250106811523, 15.256707191467285, 17.819164276123047, 20.381622314453125, 22.944080352783203, 25.50653839111328, 28.068994522094727, 30.631452560424805, 33.19390869140625, 35.75636672973633, 38.318824768066406, 40.88128662109375, 43.44374465942383, 46.006202697753906, 48.568660736083984, 51.13111877441406, 53.693572998046875, 56.25603103637695, 58.81848907470703, 61.38094711303711, 63.94340515136719, 66.505859375, 69.06832122802734, 71.63077545166016, 74.1932373046875, 76.75569152832031, 79.31814575195312, 81.88060760498047, 84.44306182861328, 87.00552368164062, 89.56797790527344, 92.13043975830078, 94.6928939819336, 97.25535583496094, 99.81781005859375, 102.38026428222656, 104.94271850585938, 107.50518035888672, 110.06763458251953, 112.63009643554688, 115.19255065917969, 117.75501251220703, 120.31746673583984, 122.87992858886719]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 8.0, 6.0, 13.0, 7.0, 11.0, 11.0, 17.0, 20.0, 14.0, 20.0, 28.0, 33.0, 30.0, 36.0, 40.0, 36.0, 43.0, 46.0, 39.0, 34.0, 35.0, 37.0, 47.0, 38.0, 40.0, 28.0, 34.0, 23.0, 29.0, 32.0, 31.0, 26.0, 27.0, 10.0, 17.0, 9.0, 7.0, 8.0, 9.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 2.0], "bins": [-27.335079193115234, -26.576263427734375, -25.81744956970215, -25.05863380432129, -24.299819946289062, -23.541004180908203, -22.782188415527344, -22.023374557495117, -21.26456069946289, -20.50574493408203, -19.746931076049805, -18.988115310668945, -18.22930145263672, -17.47048568725586, -16.711669921875, -15.952856063842773, -15.194040298461914, -14.435225486755371, -13.676410675048828, -12.917594909667969, -12.158781051635742, -11.399965286254883, -10.64115047454834, -9.882335662841797, -9.123520851135254, -8.364706039428711, -7.605891227722168, -6.847075939178467, -6.088261127471924, -5.329446315765381, -4.57063102722168, -3.8118162155151367, -3.0530033111572266, -2.2941884994506836, -1.5353734493255615, -0.7765583992004395, -0.017743587493896484, 0.7410712242126465, 1.4998865127563477, 2.2587013244628906, 3.0175161361694336, 3.7763309478759766, 4.5351457595825195, 5.293961048126221, 6.052775859832764, 6.811590671539307, 7.570405960083008, 8.32922077178955, 9.088035583496094, 9.846850395202637, 10.60566520690918, 11.364480972290039, 12.123294830322266, 12.882110595703125, 13.640925407409668, 14.399740219116211, 15.158555030822754, 15.917369842529297, 16.676185607910156, 17.434999465942383, 18.193815231323242, 18.95262908935547, 19.711444854736328, 20.470260620117188, 21.229074478149414]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 26.0, 23.0, 48.0, 70.0, 111.0, 193.0, 288.0, 540.0, 981.0, 1735.0, 3196.0, 6317.0, 11818.0, 23517.0, 47105.0, 93881.0, 182018.0, 268114.0, 197726.0, 104813.0, 52145.0, 25933.0, 13123.0, 6745.0, 3639.0, 1920.0, 1065.0, 608.0, 342.0, 183.0, 102.0, 80.0, 52.0, 21.0, 16.0, 12.0, 15.0, 5.0, 7.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.4010009765625, -11.981689453125, -11.5623779296875, -11.14306640625, -10.7237548828125, -10.304443359375, -9.8851318359375, -9.4658203125, -9.0465087890625, -8.627197265625, -8.2078857421875, -7.78857421875, -7.3692626953125, -6.949951171875, -6.5306396484375, -6.111328125, -5.6920166015625, -5.272705078125, -4.8533935546875, -4.43408203125, -4.0147705078125, -3.595458984375, -3.1761474609375, -2.7568359375, -2.3375244140625, -1.918212890625, -1.4989013671875, -1.07958984375, -0.6602783203125, -0.240966796875, 0.1783447265625, 0.59765625, 1.0169677734375, 1.436279296875, 1.8555908203125, 2.27490234375, 2.6942138671875, 3.113525390625, 3.5328369140625, 3.9521484375, 4.3714599609375, 4.790771484375, 5.2100830078125, 5.62939453125, 6.0487060546875, 6.468017578125, 6.8873291015625, 7.306640625, 7.7259521484375, 8.145263671875, 8.5645751953125, 8.98388671875, 9.4031982421875, 9.822509765625, 10.2418212890625, 10.6611328125, 11.0804443359375, 11.499755859375, 11.9190673828125, 12.33837890625, 12.7576904296875, 13.177001953125, 13.5963134765625, 14.015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 8.0, 10.0, 10.0, 12.0, 12.0, 15.0, 18.0, 23.0, 36.0, 35.0, 39.0, 30.0, 43.0, 57.0, 35.0, 40.0, 57.0, 53.0, 43.0, 38.0, 42.0, 53.0, 26.0, 38.0, 36.0, 33.0, 26.0, 21.0, 21.0, 17.0, 7.0, 22.0, 10.0, 8.0, 3.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.220703125, -3.124359130859375, -3.02801513671875, -2.931671142578125, -2.8353271484375, -2.738983154296875, -2.64263916015625, -2.546295166015625, -2.449951171875, -2.353607177734375, -2.25726318359375, -2.160919189453125, -2.0645751953125, -1.968231201171875, -1.87188720703125, -1.775543212890625, -1.67919921875, -1.582855224609375, -1.48651123046875, -1.390167236328125, -1.2938232421875, -1.197479248046875, -1.10113525390625, -1.004791259765625, -0.908447265625, -0.812103271484375, -0.71575927734375, -0.619415283203125, -0.5230712890625, -0.426727294921875, -0.33038330078125, -0.234039306640625, -0.1376953125, -0.041351318359375, 0.05499267578125, 0.151336669921875, 0.2476806640625, 0.344024658203125, 0.44036865234375, 0.536712646484375, 0.633056640625, 0.729400634765625, 0.82574462890625, 0.922088623046875, 1.0184326171875, 1.114776611328125, 1.21112060546875, 1.307464599609375, 1.40380859375, 1.500152587890625, 1.59649658203125, 1.692840576171875, 1.7891845703125, 1.885528564453125, 1.98187255859375, 2.078216552734375, 2.174560546875, 2.270904541015625, 2.36724853515625, 2.463592529296875, 2.5599365234375, 2.656280517578125, 2.75262451171875, 2.848968505859375, 2.9453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 8.0, 16.0, 17.0, 24.0, 41.0, 63.0, 92.0, 164.0, 265.0, 362.0, 769.0, 1561.0, 3824.0, 11697.0, 41443.0, 154354.0, 452539.0, 275190.0, 74851.0, 20159.0, 6301.0, 2366.0, 1070.0, 554.0, 300.0, 191.0, 106.0, 77.0, 50.0, 29.0, 14.0, 10.0, 18.0, 11.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.191162109375, -21.49169921875, -20.792236328125, -20.0927734375, -19.393310546875, -18.69384765625, -17.994384765625, -17.294921875, -16.595458984375, -15.89599609375, -15.196533203125, -14.4970703125, -13.797607421875, -13.09814453125, -12.398681640625, -11.69921875, -10.999755859375, -10.30029296875, -9.600830078125, -8.9013671875, -8.201904296875, -7.50244140625, -6.802978515625, -6.103515625, -5.404052734375, -4.70458984375, -4.005126953125, -3.3056640625, -2.606201171875, -1.90673828125, -1.207275390625, -0.5078125, 0.191650390625, 0.89111328125, 1.590576171875, 2.2900390625, 2.989501953125, 3.68896484375, 4.388427734375, 5.087890625, 5.787353515625, 6.48681640625, 7.186279296875, 7.8857421875, 8.585205078125, 9.28466796875, 9.984130859375, 10.68359375, 11.383056640625, 12.08251953125, 12.781982421875, 13.4814453125, 14.180908203125, 14.88037109375, 15.579833984375, 16.279296875, 16.978759765625, 17.67822265625, 18.377685546875, 19.0771484375, 19.776611328125, 20.47607421875, 21.175537109375, 21.875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 8.0, 1.0, 9.0, 8.0, 12.0, 8.0, 10.0, 19.0, 14.0, 26.0, 17.0, 30.0, 28.0, 42.0, 29.0, 38.0, 42.0, 34.0, 45.0, 46.0, 42.0, 38.0, 44.0, 35.0, 46.0, 49.0, 42.0, 33.0, 28.0, 27.0, 26.0, 18.0, 26.0, 19.0, 12.0, 7.0, 10.0, 7.0, 7.0, 7.0, 1.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.109375, -14.67626953125, -14.2431640625, -13.81005859375, -13.376953125, -12.94384765625, -12.5107421875, -12.07763671875, -11.64453125, -11.21142578125, -10.7783203125, -10.34521484375, -9.912109375, -9.47900390625, -9.0458984375, -8.61279296875, -8.1796875, -7.74658203125, -7.3134765625, -6.88037109375, -6.447265625, -6.01416015625, -5.5810546875, -5.14794921875, -4.71484375, -4.28173828125, -3.8486328125, -3.41552734375, -2.982421875, -2.54931640625, -2.1162109375, -1.68310546875, -1.25, -0.81689453125, -0.3837890625, 0.04931640625, 0.482421875, 0.91552734375, 1.3486328125, 1.78173828125, 2.21484375, 2.64794921875, 3.0810546875, 3.51416015625, 3.947265625, 4.38037109375, 4.8134765625, 5.24658203125, 5.6796875, 6.11279296875, 6.5458984375, 6.97900390625, 7.412109375, 7.84521484375, 8.2783203125, 8.71142578125, 9.14453125, 9.57763671875, 10.0107421875, 10.44384765625, 10.876953125, 11.31005859375, 11.7431640625, 12.17626953125, 12.609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 7.0, 12.0, 19.0, 24.0, 31.0, 52.0, 85.0, 150.0, 281.0, 461.0, 969.0, 2024.0, 4563.0, 12155.0, 37800.0, 152340.0, 484974.0, 261238.0, 61958.0, 17687.0, 6318.0, 2617.0, 1290.0, 625.0, 337.0, 193.0, 123.0, 81.0, 49.0, 27.0, 21.0, 11.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.0625, -11.7147216796875, -11.366943359375, -11.0191650390625, -10.67138671875, -10.3236083984375, -9.975830078125, -9.6280517578125, -9.2802734375, -8.9324951171875, -8.584716796875, -8.2369384765625, -7.88916015625, -7.5413818359375, -7.193603515625, -6.8458251953125, -6.498046875, -6.1502685546875, -5.802490234375, -5.4547119140625, -5.10693359375, -4.7591552734375, -4.411376953125, -4.0635986328125, -3.7158203125, -3.3680419921875, -3.020263671875, -2.6724853515625, -2.32470703125, -1.9769287109375, -1.629150390625, -1.2813720703125, -0.93359375, -0.5858154296875, -0.238037109375, 0.1097412109375, 0.45751953125, 0.8052978515625, 1.153076171875, 1.5008544921875, 1.8486328125, 2.1964111328125, 2.544189453125, 2.8919677734375, 3.23974609375, 3.5875244140625, 3.935302734375, 4.2830810546875, 4.630859375, 4.9786376953125, 5.326416015625, 5.6741943359375, 6.02197265625, 6.3697509765625, 6.717529296875, 7.0653076171875, 7.4130859375, 7.7608642578125, 8.108642578125, 8.4564208984375, 8.80419921875, 9.1519775390625, 9.499755859375, 9.8475341796875, 10.1953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 10.0, 9.0, 21.0, 35.0, 50.0, 61.0, 73.0, 141.0, 185.0, 117.0, 72.0, 53.0, 28.0, 36.0, 24.0, 16.0, 15.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002399444580078125, -0.0023117363452911377, -0.0022240281105041504, -0.002136319875717163, -0.0020486116409301758, -0.0019609034061431885, -0.0018731951713562012, -0.0017854869365692139, -0.0016977787017822266, -0.0016100704669952393, -0.001522362232208252, -0.0014346539974212646, -0.0013469457626342773, -0.00125923752784729, -0.0011715292930603027, -0.0010838210582733154, -0.0009961128234863281, -0.0009084045886993408, -0.0008206963539123535, -0.0007329881191253662, -0.0006452798843383789, -0.0005575716495513916, -0.0004698634147644043, -0.000382155179977417, -0.0002944469451904297, -0.00020673871040344238, -0.00011903047561645508, -3.1322240829467773e-05, 5.638599395751953e-05, 0.00014409422874450684, 0.00023180246353149414, 0.00031951069831848145, 0.00040721893310546875, 0.0004949271678924561, 0.0005826354026794434, 0.0006703436374664307, 0.000758051872253418, 0.0008457601070404053, 0.0009334683418273926, 0.0010211765766143799, 0.0011088848114013672, 0.0011965930461883545, 0.0012843012809753418, 0.001372009515762329, 0.0014597177505493164, 0.0015474259853363037, 0.001635134220123291, 0.0017228424549102783, 0.0018105506896972656, 0.001898258924484253, 0.0019859671592712402, 0.0020736753940582275, 0.002161383628845215, 0.002249091863632202, 0.0023368000984191895, 0.0024245083332061768, 0.002512216567993164, 0.0025999248027801514, 0.0026876330375671387, 0.002775341272354126, 0.0028630495071411133, 0.0029507577419281006, 0.003038465976715088, 0.003126174211502075, 0.0032138824462890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 14.0, 12.0, 23.0, 42.0, 41.0, 63.0, 128.0, 189.0, 384.0, 673.0, 1405.0, 2841.0, 6964.0, 20270.0, 76767.0, 370725.0, 436077.0, 93816.0, 23759.0, 7916.0, 3218.0, 1507.0, 754.0, 351.0, 211.0, 134.0, 90.0, 52.0, 34.0, 27.0, 16.0, 15.0, 11.0, 2.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.96875, -12.5765380859375, -12.184326171875, -11.7921142578125, -11.39990234375, -11.0076904296875, -10.615478515625, -10.2232666015625, -9.8310546875, -9.4388427734375, -9.046630859375, -8.6544189453125, -8.26220703125, -7.8699951171875, -7.477783203125, -7.0855712890625, -6.693359375, -6.3011474609375, -5.908935546875, -5.5167236328125, -5.12451171875, -4.7322998046875, -4.340087890625, -3.9478759765625, -3.5556640625, -3.1634521484375, -2.771240234375, -2.3790283203125, -1.98681640625, -1.5946044921875, -1.202392578125, -0.8101806640625, -0.41796875, -0.0257568359375, 0.366455078125, 0.7586669921875, 1.15087890625, 1.5430908203125, 1.935302734375, 2.3275146484375, 2.7197265625, 3.1119384765625, 3.504150390625, 3.8963623046875, 4.28857421875, 4.6807861328125, 5.072998046875, 5.4652099609375, 5.857421875, 6.2496337890625, 6.641845703125, 7.0340576171875, 7.42626953125, 7.8184814453125, 8.210693359375, 8.6029052734375, 8.9951171875, 9.3873291015625, 9.779541015625, 10.1717529296875, 10.56396484375, 10.9561767578125, 11.348388671875, 11.7406005859375, 12.1328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 4.0, 6.0, 6.0, 9.0, 13.0, 27.0, 25.0, 47.0, 38.0, 53.0, 66.0, 98.0, 111.0, 87.0, 78.0, 79.0, 55.0, 44.0, 40.0, 20.0, 21.0, 18.0, 4.0, 6.0, 12.0, 9.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.7734375, -9.5003662109375, -9.227294921875, -8.9542236328125, -8.68115234375, -8.4080810546875, -8.135009765625, -7.8619384765625, -7.5888671875, -7.3157958984375, -7.042724609375, -6.7696533203125, -6.49658203125, -6.2235107421875, -5.950439453125, -5.6773681640625, -5.404296875, -5.1312255859375, -4.858154296875, -4.5850830078125, -4.31201171875, -4.0389404296875, -3.765869140625, -3.4927978515625, -3.2197265625, -2.9466552734375, -2.673583984375, -2.4005126953125, -2.12744140625, -1.8543701171875, -1.581298828125, -1.3082275390625, -1.03515625, -0.7620849609375, -0.489013671875, -0.2159423828125, 0.05712890625, 0.3302001953125, 0.603271484375, 0.8763427734375, 1.1494140625, 1.4224853515625, 1.695556640625, 1.9686279296875, 2.24169921875, 2.5147705078125, 2.787841796875, 3.0609130859375, 3.333984375, 3.6070556640625, 3.880126953125, 4.1531982421875, 4.42626953125, 4.6993408203125, 4.972412109375, 5.2454833984375, 5.5185546875, 5.7916259765625, 6.064697265625, 6.3377685546875, 6.61083984375, 6.8839111328125, 7.156982421875, 7.4300537109375, 7.703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 31.0, 36.0, 52.0, 71.0, 101.0, 108.0, 125.0, 128.0, 102.0, 76.0, 58.0, 28.0, 19.0, 17.0, 13.0, 10.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.25979614257812, -118.14527893066406, -114.03075408935547, -109.91622924804688, -105.80171203613281, -101.68719482421875, -97.57266998291016, -93.45814514160156, -89.3436279296875, -85.22911071777344, -81.11458587646484, -77.00006103515625, -72.88554382324219, -68.77102661132812, -64.65650177001953, -60.5419807434082, -56.427459716796875, -52.31293869018555, -48.19841766357422, -44.08389663696289, -39.96937561035156, -35.854854583740234, -31.740333557128906, -27.625812530517578, -23.51129150390625, -19.396770477294922, -15.282249450683594, -11.167728424072266, -7.0532073974609375, -2.9386863708496094, 1.1758346557617188, 5.290355682373047, 9.404861450195312, 13.51938247680664, 17.63390350341797, 21.748424530029297, 25.862945556640625, 29.977466583251953, 34.09198760986328, 38.20650863647461, 42.32102966308594, 46.435550689697266, 50.550071716308594, 54.66459274291992, 58.77911376953125, 62.89363479614258, 67.0081558227539, 71.1226806640625, 75.23719787597656, 79.35171508789062, 83.46623992919922, 87.58076477050781, 91.69528198242188, 95.80979919433594, 99.92432403564453, 104.03884887695312, 108.15336608886719, 112.26788330078125, 116.38240814208984, 120.49693298339844, 124.6114501953125, 128.72596740722656, 132.84048461914062, 136.95501708984375, 141.0695343017578]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 9.0, 15.0, 10.0, 17.0, 9.0, 19.0, 17.0, 22.0, 14.0, 28.0, 31.0, 35.0, 35.0, 42.0, 48.0, 48.0, 33.0, 39.0, 46.0, 41.0, 40.0, 36.0, 36.0, 32.0, 36.0, 41.0, 35.0, 35.0, 15.0, 18.0, 13.0, 21.0, 13.0, 14.0, 13.0, 8.0, 5.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-70.58682250976562, -68.28035736083984, -65.97389221191406, -63.66742706298828, -61.3609619140625, -59.05449676513672, -56.74803161621094, -54.441566467285156, -52.135101318359375, -49.828636169433594, -47.52217102050781, -45.21570587158203, -42.90924072265625, -40.60277557373047, -38.29631042480469, -35.989845275878906, -33.683380126953125, -31.376914978027344, -29.070449829101562, -26.76398468017578, -24.45751953125, -22.15105438232422, -19.844589233398438, -17.538124084472656, -15.231658935546875, -12.925193786621094, -10.618728637695312, -8.312263488769531, -6.00579833984375, -3.6993331909179688, -1.3928680419921875, 0.9135971069335938, 3.220062255859375, 5.526527404785156, 7.8329925537109375, 10.139457702636719, 12.4459228515625, 14.752388000488281, 17.058853149414062, 19.365318298339844, 21.671783447265625, 23.978248596191406, 26.284713745117188, 28.59117889404297, 30.89764404296875, 33.20410919189453, 35.51057434082031, 37.817039489746094, 40.123504638671875, 42.429969787597656, 44.73643493652344, 47.04290008544922, 49.349365234375, 51.65583038330078, 53.96229553222656, 56.268760681152344, 58.575225830078125, 60.881690979003906, 63.18815612792969, 65.49462127685547, 67.80108642578125, 70.10755157470703, 72.41401672363281, 74.7204818725586, 77.02694702148438]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 10.0, 16.0, 26.0, 40.0, 94.0, 133.0, 242.0, 478.0, 947.0, 1924.0, 4829.0, 11601.0, 31725.0, 99929.0, 459119.0, 3116531.0, 342070.0, 81025.0, 26222.0, 9637.0, 4027.0, 1787.0, 869.0, 443.0, 208.0, 143.0, 78.0, 47.0, 28.0, 16.0, 21.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.546875, -21.891845703125, -21.23681640625, -20.581787109375, -19.9267578125, -19.271728515625, -18.61669921875, -17.961669921875, -17.306640625, -16.651611328125, -15.99658203125, -15.341552734375, -14.6865234375, -14.031494140625, -13.37646484375, -12.721435546875, -12.06640625, -11.411376953125, -10.75634765625, -10.101318359375, -9.4462890625, -8.791259765625, -8.13623046875, -7.481201171875, -6.826171875, -6.171142578125, -5.51611328125, -4.861083984375, -4.2060546875, -3.551025390625, -2.89599609375, -2.240966796875, -1.5859375, -0.930908203125, -0.27587890625, 0.379150390625, 1.0341796875, 1.689208984375, 2.34423828125, 2.999267578125, 3.654296875, 4.309326171875, 4.96435546875, 5.619384765625, 6.2744140625, 6.929443359375, 7.58447265625, 8.239501953125, 8.89453125, 9.549560546875, 10.20458984375, 10.859619140625, 11.5146484375, 12.169677734375, 12.82470703125, 13.479736328125, 14.134765625, 14.789794921875, 15.44482421875, 16.099853515625, 16.7548828125, 17.409912109375, 18.06494140625, 18.719970703125, 19.375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 11.0, 5.0, 16.0, 12.0, 21.0, 14.0, 20.0, 18.0, 18.0, 20.0, 25.0, 37.0, 42.0, 37.0, 42.0, 43.0, 37.0, 35.0, 41.0, 43.0, 52.0, 42.0, 33.0, 42.0, 42.0, 30.0, 30.0, 30.0, 26.0, 17.0, 21.0, 12.0, 14.0, 12.0, 12.0, 8.0, 6.0, 4.0, 5.0, 8.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.87890625, -2.793609619140625, -2.70831298828125, -2.623016357421875, -2.5377197265625, -2.452423095703125, -2.36712646484375, -2.281829833984375, -2.196533203125, -2.111236572265625, -2.02593994140625, -1.940643310546875, -1.8553466796875, -1.770050048828125, -1.68475341796875, -1.599456787109375, -1.51416015625, -1.428863525390625, -1.34356689453125, -1.258270263671875, -1.1729736328125, -1.087677001953125, -1.00238037109375, -0.917083740234375, -0.831787109375, -0.746490478515625, -0.66119384765625, -0.575897216796875, -0.4906005859375, -0.405303955078125, -0.32000732421875, -0.234710693359375, -0.1494140625, -0.064117431640625, 0.02117919921875, 0.106475830078125, 0.1917724609375, 0.277069091796875, 0.36236572265625, 0.447662353515625, 0.532958984375, 0.618255615234375, 0.70355224609375, 0.788848876953125, 0.8741455078125, 0.959442138671875, 1.04473876953125, 1.130035400390625, 1.21533203125, 1.300628662109375, 1.38592529296875, 1.471221923828125, 1.5565185546875, 1.641815185546875, 1.72711181640625, 1.812408447265625, 1.897705078125, 1.983001708984375, 2.06829833984375, 2.153594970703125, 2.2388916015625, 2.324188232421875, 2.40948486328125, 2.494781494140625, 2.580078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 13.0, 10.0, 13.0, 18.0, 29.0, 44.0, 53.0, 85.0, 127.0, 210.0, 340.0, 604.0, 1260.0, 2433.0, 5110.0, 11907.0, 28986.0, 81917.0, 280930.0, 2094758.0, 1335884.0, 233331.0, 70664.0, 25638.0, 10447.0, 4604.0, 2219.0, 1179.0, 598.0, 325.0, 193.0, 116.0, 77.0, 42.0, 36.0, 26.0, 12.0, 10.0, 13.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.796875, -17.239501953125, -16.68212890625, -16.124755859375, -15.5673828125, -15.010009765625, -14.45263671875, -13.895263671875, -13.337890625, -12.780517578125, -12.22314453125, -11.665771484375, -11.1083984375, -10.551025390625, -9.99365234375, -9.436279296875, -8.87890625, -8.321533203125, -7.76416015625, -7.206787109375, -6.6494140625, -6.092041015625, -5.53466796875, -4.977294921875, -4.419921875, -3.862548828125, -3.30517578125, -2.747802734375, -2.1904296875, -1.633056640625, -1.07568359375, -0.518310546875, 0.0390625, 0.596435546875, 1.15380859375, 1.711181640625, 2.2685546875, 2.825927734375, 3.38330078125, 3.940673828125, 4.498046875, 5.055419921875, 5.61279296875, 6.170166015625, 6.7275390625, 7.284912109375, 7.84228515625, 8.399658203125, 8.95703125, 9.514404296875, 10.07177734375, 10.629150390625, 11.1865234375, 11.743896484375, 12.30126953125, 12.858642578125, 13.416015625, 13.973388671875, 14.53076171875, 15.088134765625, 15.6455078125, 16.202880859375, 16.76025390625, 17.317626953125, 17.875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 6.0, 7.0, 11.0, 25.0, 24.0, 28.0, 45.0, 42.0, 79.0, 92.0, 115.0, 179.0, 239.0, 412.0, 966.0, 612.0, 365.0, 223.0, 157.0, 105.0, 76.0, 51.0, 49.0, 31.0, 23.0, 22.0, 21.0, 13.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.078125, -6.8402099609375, -6.602294921875, -6.3643798828125, -6.12646484375, -5.8885498046875, -5.650634765625, -5.4127197265625, -5.1748046875, -4.9368896484375, -4.698974609375, -4.4610595703125, -4.22314453125, -3.9852294921875, -3.747314453125, -3.5093994140625, -3.271484375, -3.0335693359375, -2.795654296875, -2.5577392578125, -2.31982421875, -2.0819091796875, -1.843994140625, -1.6060791015625, -1.3681640625, -1.1302490234375, -0.892333984375, -0.6544189453125, -0.41650390625, -0.1785888671875, 0.059326171875, 0.2972412109375, 0.53515625, 0.7730712890625, 1.010986328125, 1.2489013671875, 1.48681640625, 1.7247314453125, 1.962646484375, 2.2005615234375, 2.4384765625, 2.6763916015625, 2.914306640625, 3.1522216796875, 3.39013671875, 3.6280517578125, 3.865966796875, 4.1038818359375, 4.341796875, 4.5797119140625, 4.817626953125, 5.0555419921875, 5.29345703125, 5.5313720703125, 5.769287109375, 6.0072021484375, 6.2451171875, 6.4830322265625, 6.720947265625, 6.9588623046875, 7.19677734375, 7.4346923828125, 7.672607421875, 7.9105224609375, 8.1484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 10.0, 12.0, 34.0, 61.0, 77.0, 145.0, 174.0, 152.0, 131.0, 90.0, 44.0, 24.0, 23.0, 12.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.36531066894531, -54.29949951171875, -51.23368453979492, -48.167869567871094, -45.10205841064453, -42.03624725341797, -38.97043228149414, -35.90461730957031, -32.83880615234375, -29.772993087768555, -26.70718002319336, -23.641366958618164, -20.57555389404297, -17.509740829467773, -14.443927764892578, -11.378114700317383, -8.312301635742188, -5.246488571166992, -2.180675506591797, 0.8851375579833984, 3.9509506225585938, 7.016763687133789, 10.082576751708984, 13.14838981628418, 16.214202880859375, 19.28001594543457, 22.345829010009766, 25.41164207458496, 28.477455139160156, 31.54326820373535, 34.60908126831055, 37.674896240234375, 40.74070739746094, 43.8065185546875, 46.87233352661133, 49.938148498535156, 53.00395965576172, 56.06977081298828, 59.13558578491211, 62.20140075683594, 65.2672119140625, 68.33302307128906, 71.39883422851562, 74.46465301513672, 77.53046417236328, 80.59627532958984, 83.66209411621094, 86.7279052734375, 89.79371643066406, 92.85952758789062, 95.92533874511719, 98.99115753173828, 102.05696868896484, 105.1227798461914, 108.1885986328125, 111.25440979003906, 114.32022094726562, 117.38603210449219, 120.45184326171875, 123.51766204833984, 126.5834732055664, 129.6492919921875, 132.71510314941406, 135.78091430664062, 138.8467254638672]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 8.0, 7.0, 11.0, 6.0, 13.0, 17.0, 13.0, 23.0, 16.0, 12.0, 34.0, 28.0, 32.0, 25.0, 36.0, 31.0, 28.0, 33.0, 38.0, 37.0, 39.0, 35.0, 39.0, 34.0, 39.0, 30.0, 29.0, 27.0, 38.0, 25.0, 23.0, 28.0, 26.0, 26.0, 13.0, 15.0, 12.0, 10.0, 13.0, 11.0, 9.0, 7.0, 5.0, 3.0, 9.0, 2.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.857507705688477, -28.95193099975586, -28.046356201171875, -27.14078140258789, -26.235204696655273, -25.329627990722656, -24.424053192138672, -23.518478393554688, -22.61290168762207, -21.707324981689453, -20.80175018310547, -19.896175384521484, -18.990598678588867, -18.08502197265625, -17.179447174072266, -16.27387237548828, -15.368295669555664, -14.462719917297363, -13.557144165039062, -12.651568412780762, -11.745992660522461, -10.84041690826416, -9.93484115600586, -9.029265403747559, -8.123689651489258, -7.218113899230957, -6.312538146972656, -5.4069623947143555, -4.501386642456055, -3.595810890197754, -2.690235137939453, -1.7846593856811523, -0.8790817260742188, 0.02649402618408203, 0.9320697784423828, 1.8376455307006836, 2.7432212829589844, 3.648797035217285, 4.554372787475586, 5.459948539733887, 6.3655242919921875, 7.271100044250488, 8.176675796508789, 9.08225154876709, 9.98782730102539, 10.893403053283691, 11.798978805541992, 12.704554557800293, 13.610130310058594, 14.515706062316895, 15.421281814575195, 16.326858520507812, 17.232433319091797, 18.13800811767578, 19.0435848236084, 19.949161529541016, 20.854736328125, 21.760311126708984, 22.6658878326416, 23.57146453857422, 24.477039337158203, 25.382614135742188, 26.288190841674805, 27.193767547607422, 28.099342346191406]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 7.0, 8.0, 21.0, 27.0, 28.0, 45.0, 104.0, 172.0, 316.0, 664.0, 1453.0, 3569.0, 9208.0, 23927.0, 65817.0, 188892.0, 438502.0, 203520.0, 70129.0, 25854.0, 9497.0, 3770.0, 1586.0, 671.0, 335.0, 177.0, 85.0, 52.0, 40.0, 23.0, 21.0, 9.0, 9.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 3.0], "bins": [-29.46875, -28.74169921875, -28.0146484375, -27.28759765625, -26.560546875, -25.83349609375, -25.1064453125, -24.37939453125, -23.65234375, -22.92529296875, -22.1982421875, -21.47119140625, -20.744140625, -20.01708984375, -19.2900390625, -18.56298828125, -17.8359375, -17.10888671875, -16.3818359375, -15.65478515625, -14.927734375, -14.20068359375, -13.4736328125, -12.74658203125, -12.01953125, -11.29248046875, -10.5654296875, -9.83837890625, -9.111328125, -8.38427734375, -7.6572265625, -6.93017578125, -6.203125, -5.47607421875, -4.7490234375, -4.02197265625, -3.294921875, -2.56787109375, -1.8408203125, -1.11376953125, -0.38671875, 0.34033203125, 1.0673828125, 1.79443359375, 2.521484375, 3.24853515625, 3.9755859375, 4.70263671875, 5.4296875, 6.15673828125, 6.8837890625, 7.61083984375, 8.337890625, 9.06494140625, 9.7919921875, 10.51904296875, 11.24609375, 11.97314453125, 12.7001953125, 13.42724609375, 14.154296875, 14.88134765625, 15.6083984375, 16.33544921875, 17.0625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 9.0, 4.0, 11.0, 21.0, 16.0, 18.0, 27.0, 17.0, 19.0, 31.0, 27.0, 38.0, 46.0, 44.0, 50.0, 45.0, 37.0, 51.0, 49.0, 54.0, 55.0, 44.0, 34.0, 32.0, 30.0, 27.0, 29.0, 22.0, 21.0, 15.0, 17.0, 16.0, 8.0, 9.0, 7.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.115234375, -3.01849365234375, -2.9217529296875, -2.82501220703125, -2.728271484375, -2.63153076171875, -2.5347900390625, -2.43804931640625, -2.34130859375, -2.24456787109375, -2.1478271484375, -2.05108642578125, -1.954345703125, -1.85760498046875, -1.7608642578125, -1.66412353515625, -1.5673828125, -1.47064208984375, -1.3739013671875, -1.27716064453125, -1.180419921875, -1.08367919921875, -0.9869384765625, -0.89019775390625, -0.79345703125, -0.69671630859375, -0.5999755859375, -0.50323486328125, -0.406494140625, -0.30975341796875, -0.2130126953125, -0.11627197265625, -0.01953125, 0.07720947265625, 0.1739501953125, 0.27069091796875, 0.367431640625, 0.46417236328125, 0.5609130859375, 0.65765380859375, 0.75439453125, 0.85113525390625, 0.9478759765625, 1.04461669921875, 1.141357421875, 1.23809814453125, 1.3348388671875, 1.43157958984375, 1.5283203125, 1.62506103515625, 1.7218017578125, 1.81854248046875, 1.915283203125, 2.01202392578125, 2.1087646484375, 2.20550537109375, 2.30224609375, 2.39898681640625, 2.4957275390625, 2.59246826171875, 2.689208984375, 2.78594970703125, 2.8826904296875, 2.97943115234375, 3.076171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 10.0, 15.0, 20.0, 26.0, 37.0, 52.0, 85.0, 185.0, 255.0, 437.0, 844.0, 1746.0, 3624.0, 8766.0, 27102.0, 99183.0, 406881.0, 370137.0, 89404.0, 24399.0, 8390.0, 3325.0, 1682.0, 813.0, 431.0, 262.0, 146.0, 103.0, 63.0, 30.0, 27.0, 14.0, 13.0, 7.0, 10.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.27490234375, -19.5498046875, -18.82470703125, -18.099609375, -17.37451171875, -16.6494140625, -15.92431640625, -15.19921875, -14.47412109375, -13.7490234375, -13.02392578125, -12.298828125, -11.57373046875, -10.8486328125, -10.12353515625, -9.3984375, -8.67333984375, -7.9482421875, -7.22314453125, -6.498046875, -5.77294921875, -5.0478515625, -4.32275390625, -3.59765625, -2.87255859375, -2.1474609375, -1.42236328125, -0.697265625, 0.02783203125, 0.7529296875, 1.47802734375, 2.203125, 2.92822265625, 3.6533203125, 4.37841796875, 5.103515625, 5.82861328125, 6.5537109375, 7.27880859375, 8.00390625, 8.72900390625, 9.4541015625, 10.17919921875, 10.904296875, 11.62939453125, 12.3544921875, 13.07958984375, 13.8046875, 14.52978515625, 15.2548828125, 15.97998046875, 16.705078125, 17.43017578125, 18.1552734375, 18.88037109375, 19.60546875, 20.33056640625, 21.0556640625, 21.78076171875, 22.505859375, 23.23095703125, 23.9560546875, 24.68115234375, 25.40625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 8.0, 5.0, 11.0, 8.0, 12.0, 7.0, 17.0, 10.0, 24.0, 25.0, 27.0, 37.0, 44.0, 36.0, 42.0, 53.0, 53.0, 51.0, 54.0, 48.0, 44.0, 48.0, 38.0, 42.0, 44.0, 33.0, 23.0, 23.0, 27.0, 20.0, 11.0, 14.0, 18.0, 7.0, 7.0, 10.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.1875, -16.69091796875, -16.1943359375, -15.69775390625, -15.201171875, -14.70458984375, -14.2080078125, -13.71142578125, -13.21484375, -12.71826171875, -12.2216796875, -11.72509765625, -11.228515625, -10.73193359375, -10.2353515625, -9.73876953125, -9.2421875, -8.74560546875, -8.2490234375, -7.75244140625, -7.255859375, -6.75927734375, -6.2626953125, -5.76611328125, -5.26953125, -4.77294921875, -4.2763671875, -3.77978515625, -3.283203125, -2.78662109375, -2.2900390625, -1.79345703125, -1.296875, -0.80029296875, -0.3037109375, 0.19287109375, 0.689453125, 1.18603515625, 1.6826171875, 2.17919921875, 2.67578125, 3.17236328125, 3.6689453125, 4.16552734375, 4.662109375, 5.15869140625, 5.6552734375, 6.15185546875, 6.6484375, 7.14501953125, 7.6416015625, 8.13818359375, 8.634765625, 9.13134765625, 9.6279296875, 10.12451171875, 10.62109375, 11.11767578125, 11.6142578125, 12.11083984375, 12.607421875, 13.10400390625, 13.6005859375, 14.09716796875, 14.59375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 6.0, 7.0, 12.0, 20.0, 26.0, 31.0, 65.0, 104.0, 207.0, 375.0, 800.0, 1700.0, 4040.0, 10715.0, 34493.0, 150490.0, 586109.0, 196210.0, 41933.0, 12602.0, 4753.0, 2001.0, 865.0, 462.0, 223.0, 107.0, 80.0, 42.0, 20.0, 17.0, 9.0, 5.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.796875, -18.282958984375, -17.76904296875, -17.255126953125, -16.7412109375, -16.227294921875, -15.71337890625, -15.199462890625, -14.685546875, -14.171630859375, -13.65771484375, -13.143798828125, -12.6298828125, -12.115966796875, -11.60205078125, -11.088134765625, -10.57421875, -10.060302734375, -9.54638671875, -9.032470703125, -8.5185546875, -8.004638671875, -7.49072265625, -6.976806640625, -6.462890625, -5.948974609375, -5.43505859375, -4.921142578125, -4.4072265625, -3.893310546875, -3.37939453125, -2.865478515625, -2.3515625, -1.837646484375, -1.32373046875, -0.809814453125, -0.2958984375, 0.218017578125, 0.73193359375, 1.245849609375, 1.759765625, 2.273681640625, 2.78759765625, 3.301513671875, 3.8154296875, 4.329345703125, 4.84326171875, 5.357177734375, 5.87109375, 6.385009765625, 6.89892578125, 7.412841796875, 7.9267578125, 8.440673828125, 8.95458984375, 9.468505859375, 9.982421875, 10.496337890625, 11.01025390625, 11.524169921875, 12.0380859375, 12.552001953125, 13.06591796875, 13.579833984375, 14.09375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 0.0, 6.0, 5.0, 9.0, 15.0, 23.0, 36.0, 60.0, 99.0, 224.0, 255.0, 99.0, 69.0, 23.0, 22.0, 20.0, 15.0, 8.0, 2.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006664276123046875, -0.006501883268356323, -0.0063394904136657715, -0.00617709755897522, -0.006014704704284668, -0.005852311849594116, -0.0056899189949035645, -0.005527526140213013, -0.005365133285522461, -0.005202740430831909, -0.005040347576141357, -0.004877954721450806, -0.004715561866760254, -0.004553169012069702, -0.00439077615737915, -0.004228383302688599, -0.004065990447998047, -0.003903597593307495, -0.0037412047386169434, -0.0035788118839263916, -0.00341641902923584, -0.003254026174545288, -0.0030916333198547363, -0.0029292404651641846, -0.002766847610473633, -0.002604454755783081, -0.0024420619010925293, -0.0022796690464019775, -0.0021172761917114258, -0.001954883337020874, -0.0017924904823303223, -0.0016300976276397705, -0.0014677047729492188, -0.001305311918258667, -0.0011429190635681152, -0.0009805262088775635, -0.0008181333541870117, -0.00065574049949646, -0.0004933476448059082, -0.00033095479011535645, -0.0001685619354248047, -6.16908073425293e-06, 0.00015622377395629883, 0.0003186166286468506, 0.00048100948333740234, 0.0006434023380279541, 0.0008057951927185059, 0.0009681880474090576, 0.0011305809020996094, 0.0012929737567901611, 0.0014553666114807129, 0.0016177594661712646, 0.0017801523208618164, 0.0019425451755523682, 0.00210493803024292, 0.0022673308849334717, 0.0024297237396240234, 0.002592116594314575, 0.002754509449005127, 0.0029169023036956787, 0.0030792951583862305, 0.0032416880130767822, 0.003404080867767334, 0.0035664737224578857, 0.0037288665771484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 13.0, 14.0, 22.0, 19.0, 30.0, 43.0, 72.0, 98.0, 174.0, 271.0, 485.0, 806.0, 1587.0, 3156.0, 6305.0, 14018.0, 34730.0, 105722.0, 406004.0, 335565.0, 85603.0, 29774.0, 12403.0, 5553.0, 2771.0, 1422.0, 711.0, 449.0, 219.0, 169.0, 81.0, 65.0, 49.0, 46.0, 26.0, 20.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 4.0], "bins": [-13.0, -12.6380615234375, -12.276123046875, -11.9141845703125, -11.55224609375, -11.1903076171875, -10.828369140625, -10.4664306640625, -10.1044921875, -9.7425537109375, -9.380615234375, -9.0186767578125, -8.65673828125, -8.2947998046875, -7.932861328125, -7.5709228515625, -7.208984375, -6.8470458984375, -6.485107421875, -6.1231689453125, -5.76123046875, -5.3992919921875, -5.037353515625, -4.6754150390625, -4.3134765625, -3.9515380859375, -3.589599609375, -3.2276611328125, -2.86572265625, -2.5037841796875, -2.141845703125, -1.7799072265625, -1.41796875, -1.0560302734375, -0.694091796875, -0.3321533203125, 0.02978515625, 0.3917236328125, 0.753662109375, 1.1156005859375, 1.4775390625, 1.8394775390625, 2.201416015625, 2.5633544921875, 2.92529296875, 3.2872314453125, 3.649169921875, 4.0111083984375, 4.373046875, 4.7349853515625, 5.096923828125, 5.4588623046875, 5.82080078125, 6.1827392578125, 6.544677734375, 6.9066162109375, 7.2685546875, 7.6304931640625, 7.992431640625, 8.3543701171875, 8.71630859375, 9.0782470703125, 9.440185546875, 9.8021240234375, 10.1640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 4.0, 5.0, 6.0, 3.0, 7.0, 10.0, 12.0, 16.0, 21.0, 22.0, 24.0, 25.0, 42.0, 42.0, 88.0, 95.0, 105.0, 82.0, 84.0, 72.0, 59.0, 25.0, 21.0, 23.0, 19.0, 11.0, 8.0, 6.0, 9.0, 10.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.85546875, -7.57196044921875, -7.2884521484375, -7.00494384765625, -6.721435546875, -6.43792724609375, -6.1544189453125, -5.87091064453125, -5.58740234375, -5.30389404296875, -5.0203857421875, -4.73687744140625, -4.453369140625, -4.16986083984375, -3.8863525390625, -3.60284423828125, -3.3193359375, -3.03582763671875, -2.7523193359375, -2.46881103515625, -2.185302734375, -1.90179443359375, -1.6182861328125, -1.33477783203125, -1.05126953125, -0.76776123046875, -0.4842529296875, -0.20074462890625, 0.082763671875, 0.36627197265625, 0.6497802734375, 0.93328857421875, 1.216796875, 1.50030517578125, 1.7838134765625, 2.06732177734375, 2.350830078125, 2.63433837890625, 2.9178466796875, 3.20135498046875, 3.48486328125, 3.76837158203125, 4.0518798828125, 4.33538818359375, 4.618896484375, 4.90240478515625, 5.1859130859375, 5.46942138671875, 5.7529296875, 6.03643798828125, 6.3199462890625, 6.60345458984375, 6.886962890625, 7.17047119140625, 7.4539794921875, 7.73748779296875, 8.02099609375, 8.30450439453125, 8.5880126953125, 8.87152099609375, 9.155029296875, 9.43853759765625, 9.7220458984375, 10.00555419921875, 10.2890625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 9.0, 14.0, 27.0, 23.0, 30.0, 45.0, 60.0, 65.0, 82.0, 98.0, 96.0, 87.0, 75.0, 81.0, 53.0, 45.0, 28.0, 22.0, 18.0, 12.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.95111083984375, -107.02330017089844, -103.09548950195312, -99.16767883300781, -95.2398681640625, -91.31205749511719, -87.3842544555664, -83.4564437866211, -79.52863311767578, -75.60082244873047, -71.67301177978516, -67.74520111083984, -63.8173942565918, -59.889583587646484, -55.96177673339844, -52.033966064453125, -48.10615539550781, -44.1783447265625, -40.25053405761719, -36.32272720336914, -32.39491653442383, -28.467105865478516, -24.539297103881836, -20.611488342285156, -16.683677673339844, -12.755867958068848, -8.828058242797852, -4.9002485275268555, -0.9724388122558594, 2.955371856689453, 6.883180618286133, 10.810989379882812, 14.738800048828125, 18.666610717773438, 22.594419479370117, 26.522228240966797, 30.45003890991211, 34.37784957885742, 38.30565643310547, 42.23346710205078, 46.161277770996094, 50.089088439941406, 54.01689910888672, 57.944705963134766, 61.87251663208008, 65.80032348632812, 69.72813415527344, 73.65594482421875, 77.58375549316406, 81.51156616210938, 85.43937683105469, 89.3671875, 93.29499816894531, 97.22280883789062, 101.1506118774414, 105.07842254638672, 109.00623321533203, 112.93404388427734, 116.86185455322266, 120.78966522216797, 124.71746826171875, 128.64527893066406, 132.57308959960938, 136.5009002685547, 140.4287109375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 9.0, 8.0, 8.0, 6.0, 13.0, 13.0, 22.0, 13.0, 21.0, 23.0, 26.0, 24.0, 27.0, 28.0, 36.0, 48.0, 37.0, 37.0, 36.0, 38.0, 38.0, 33.0, 43.0, 32.0, 27.0, 35.0, 28.0, 18.0, 26.0, 39.0, 20.0, 17.0, 26.0, 15.0, 17.0, 20.0, 7.0, 16.0, 9.0, 6.0, 7.0, 9.0, 6.0, 7.0, 5.0, 2.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0], "bins": [-78.81031799316406, -76.43183135986328, -74.0533447265625, -71.67485809326172, -69.29637145996094, -66.91789245605469, -64.5394058227539, -62.160919189453125, -59.782432556152344, -57.40394592285156, -55.02545928955078, -52.646976470947266, -50.268489837646484, -47.8900032043457, -45.51152038574219, -43.133033752441406, -40.754547119140625, -38.376060485839844, -35.99757385253906, -33.61909103393555, -31.240604400634766, -28.862117767333984, -26.483633041381836, -24.105148315429688, -21.726661682128906, -19.348175048828125, -16.969690322875977, -14.591204643249512, -12.212718963623047, -9.834233283996582, -7.455747604370117, -5.077262878417969, -2.6987838745117188, -0.3202981948852539, 2.058187484741211, 4.436673164367676, 6.815158843994141, 9.193644523620605, 11.57213020324707, 13.950614929199219, 16.3291015625, 18.70758819580078, 21.08607292175293, 23.464557647705078, 25.84304428100586, 28.22153091430664, 30.60001564025879, 32.97850036621094, 35.35698699951172, 37.7354736328125, 40.11396026611328, 42.4924430847168, 44.87092971801758, 47.24941635131836, 49.627899169921875, 52.006385803222656, 54.38487243652344, 56.76335906982422, 59.141845703125, 61.520328521728516, 63.8988151550293, 66.27729797363281, 68.6557846069336, 71.03427124023438, 73.41275787353516]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 12.0, 21.0, 28.0, 49.0, 65.0, 136.0, 238.0, 432.0, 902.0, 2051.0, 4623.0, 11854.0, 34741.0, 125666.0, 1302435.0, 2506817.0, 143446.0, 38562.0, 13057.0, 5039.0, 2079.0, 955.0, 445.0, 257.0, 151.0, 83.0, 51.0, 33.0, 18.0, 14.0, 3.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 3.0], "bins": [-30.0, -29.26904296875, -28.5380859375, -27.80712890625, -27.076171875, -26.34521484375, -25.6142578125, -24.88330078125, -24.15234375, -23.42138671875, -22.6904296875, -21.95947265625, -21.228515625, -20.49755859375, -19.7666015625, -19.03564453125, -18.3046875, -17.57373046875, -16.8427734375, -16.11181640625, -15.380859375, -14.64990234375, -13.9189453125, -13.18798828125, -12.45703125, -11.72607421875, -10.9951171875, -10.26416015625, -9.533203125, -8.80224609375, -8.0712890625, -7.34033203125, -6.609375, -5.87841796875, -5.1474609375, -4.41650390625, -3.685546875, -2.95458984375, -2.2236328125, -1.49267578125, -0.76171875, -0.03076171875, 0.7001953125, 1.43115234375, 2.162109375, 2.89306640625, 3.6240234375, 4.35498046875, 5.0859375, 5.81689453125, 6.5478515625, 7.27880859375, 8.009765625, 8.74072265625, 9.4716796875, 10.20263671875, 10.93359375, 11.66455078125, 12.3955078125, 13.12646484375, 13.857421875, 14.58837890625, 15.3193359375, 16.05029296875, 16.78125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 9.0, 9.0, 7.0, 12.0, 14.0, 15.0, 17.0, 17.0, 17.0, 22.0, 21.0, 17.0, 43.0, 37.0, 21.0, 41.0, 45.0, 45.0, 41.0, 41.0, 44.0, 43.0, 39.0, 41.0, 41.0, 44.0, 31.0, 31.0, 32.0, 27.0, 24.0, 10.0, 15.0, 23.0, 18.0, 7.0, 8.0, 10.0, 11.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.10711669921875, -3.0032958984375, -2.89947509765625, -2.795654296875, -2.69183349609375, -2.5880126953125, -2.48419189453125, -2.38037109375, -2.27655029296875, -2.1727294921875, -2.06890869140625, -1.965087890625, -1.86126708984375, -1.7574462890625, -1.65362548828125, -1.5498046875, -1.44598388671875, -1.3421630859375, -1.23834228515625, -1.134521484375, -1.03070068359375, -0.9268798828125, -0.82305908203125, -0.71923828125, -0.61541748046875, -0.5115966796875, -0.40777587890625, -0.303955078125, -0.20013427734375, -0.0963134765625, 0.00750732421875, 0.111328125, 0.21514892578125, 0.3189697265625, 0.42279052734375, 0.526611328125, 0.63043212890625, 0.7342529296875, 0.83807373046875, 0.94189453125, 1.04571533203125, 1.1495361328125, 1.25335693359375, 1.357177734375, 1.46099853515625, 1.5648193359375, 1.66864013671875, 1.7724609375, 1.87628173828125, 1.9801025390625, 2.08392333984375, 2.187744140625, 2.29156494140625, 2.3953857421875, 2.49920654296875, 2.60302734375, 2.70684814453125, 2.8106689453125, 2.91448974609375, 3.018310546875, 3.12213134765625, 3.2259521484375, 3.32977294921875, 3.43359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 14.0, 15.0, 22.0, 31.0, 43.0, 68.0, 98.0, 149.0, 259.0, 427.0, 744.0, 1233.0, 2214.0, 4290.0, 8684.0, 19251.0, 48349.0, 149153.0, 809484.0, 2738231.0, 279888.0, 77355.0, 29097.0, 12361.0, 5882.0, 2997.0, 1623.0, 977.0, 491.0, 288.0, 208.0, 111.0, 95.0, 49.0, 32.0, 25.0, 15.0, 9.0, 9.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.181640625, -17.48828125, -16.794921875, -16.1015625, -15.408203125, -14.71484375, -14.021484375, -13.328125, -12.634765625, -11.94140625, -11.248046875, -10.5546875, -9.861328125, -9.16796875, -8.474609375, -7.78125, -7.087890625, -6.39453125, -5.701171875, -5.0078125, -4.314453125, -3.62109375, -2.927734375, -2.234375, -1.541015625, -0.84765625, -0.154296875, 0.5390625, 1.232421875, 1.92578125, 2.619140625, 3.3125, 4.005859375, 4.69921875, 5.392578125, 6.0859375, 6.779296875, 7.47265625, 8.166015625, 8.859375, 9.552734375, 10.24609375, 10.939453125, 11.6328125, 12.326171875, 13.01953125, 13.712890625, 14.40625, 15.099609375, 15.79296875, 16.486328125, 17.1796875, 17.873046875, 18.56640625, 19.259765625, 19.953125, 20.646484375, 21.33984375, 22.033203125, 22.7265625, 23.419921875, 24.11328125, 24.806640625, 25.5]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 6.0, 2.0, 7.0, 8.0, 9.0, 11.0, 9.0, 20.0, 20.0, 33.0, 41.0, 78.0, 105.0, 164.0, 254.0, 507.0, 1339.0, 618.0, 254.0, 175.0, 121.0, 71.0, 51.0, 37.0, 29.0, 25.0, 22.0, 11.0, 11.0, 10.0, 2.0, 7.0, 6.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.1953125, -8.894775390625, -8.59423828125, -8.293701171875, -7.9931640625, -7.692626953125, -7.39208984375, -7.091552734375, -6.791015625, -6.490478515625, -6.18994140625, -5.889404296875, -5.5888671875, -5.288330078125, -4.98779296875, -4.687255859375, -4.38671875, -4.086181640625, -3.78564453125, -3.485107421875, -3.1845703125, -2.884033203125, -2.58349609375, -2.282958984375, -1.982421875, -1.681884765625, -1.38134765625, -1.080810546875, -0.7802734375, -0.479736328125, -0.17919921875, 0.121337890625, 0.421875, 0.722412109375, 1.02294921875, 1.323486328125, 1.6240234375, 1.924560546875, 2.22509765625, 2.525634765625, 2.826171875, 3.126708984375, 3.42724609375, 3.727783203125, 4.0283203125, 4.328857421875, 4.62939453125, 4.929931640625, 5.23046875, 5.531005859375, 5.83154296875, 6.132080078125, 6.4326171875, 6.733154296875, 7.03369140625, 7.334228515625, 7.634765625, 7.935302734375, 8.23583984375, 8.536376953125, 8.8369140625, 9.137451171875, 9.43798828125, 9.738525390625, 10.0390625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 18.0, 20.0, 25.0, 35.0, 53.0, 66.0, 90.0, 97.0, 102.0, 88.0, 93.0, 78.0, 60.0, 45.0, 33.0, 22.0, 19.0, 16.0, 7.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.43256378173828, -33.533267974853516, -31.63397216796875, -29.734676361083984, -27.83538055419922, -25.936084747314453, -24.03679084777832, -22.137495040893555, -20.23819923400879, -18.338903427124023, -16.439607620239258, -14.540312767028809, -12.641016960144043, -10.741721153259277, -8.842426300048828, -6.9431304931640625, -5.043834686279297, -3.1445391178131104, -1.2452435493469238, 0.6540517807006836, 2.553347587585449, 4.452643394470215, 6.351938247680664, 8.25123405456543, 10.150529861450195, 12.049825668334961, 13.949121475219727, 15.848416328430176, 17.747711181640625, 19.64700698852539, 21.546302795410156, 23.445598602294922, 25.344894409179688, 27.244190216064453, 29.14348602294922, 31.042781829833984, 32.94207763671875, 34.841373443603516, 36.74066925048828, 38.63996124267578, 40.53926086425781, 42.43855667114258, 44.337852478027344, 46.23714828491211, 48.136444091796875, 50.03573989868164, 51.935035705566406, 53.834327697753906, 55.73362350463867, 57.63291931152344, 59.5322151184082, 61.43151092529297, 63.330806732177734, 65.2301025390625, 67.12939453125, 69.02869415283203, 70.92798614501953, 72.82727813720703, 74.72657775878906, 76.62586975097656, 78.5251693725586, 80.4244613647461, 82.32376098632812, 84.22305297851562, 86.12235260009766]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 4.0, 11.0, 8.0, 12.0, 14.0, 12.0, 15.0, 26.0, 19.0, 28.0, 30.0, 32.0, 40.0, 38.0, 58.0, 57.0, 53.0, 45.0, 55.0, 49.0, 52.0, 55.0, 30.0, 31.0, 27.0, 33.0, 22.0, 24.0, 21.0, 15.0, 19.0, 10.0, 17.0, 9.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.38115692138672, -42.113739013671875, -40.846317291259766, -39.578895568847656, -38.31147766113281, -37.04405975341797, -35.77663803100586, -34.50921630859375, -33.241798400878906, -31.97437858581543, -30.706958770751953, -29.439538955688477, -28.172119140625, -26.904699325561523, -25.637279510498047, -24.36985969543457, -23.102439880371094, -21.835020065307617, -20.56760025024414, -19.300180435180664, -18.032760620117188, -16.76534080505371, -15.497920989990234, -14.230501174926758, -12.963081359863281, -11.695661544799805, -10.428241729736328, -9.160821914672852, -7.893402099609375, -6.625982284545898, -5.358562469482422, -4.091142654418945, -2.8237228393554688, -1.5563030242919922, -0.2888832092285156, 0.9785366058349609, 2.2459564208984375, 3.513376235961914, 4.780796051025391, 6.048215866088867, 7.315635681152344, 8.58305549621582, 9.850475311279297, 11.117895126342773, 12.38531494140625, 13.652734756469727, 14.920154571533203, 16.18757438659668, 17.454994201660156, 18.722414016723633, 19.98983383178711, 21.257253646850586, 22.524673461914062, 23.79209327697754, 25.059513092041016, 26.326932907104492, 27.59435272216797, 28.861772537231445, 30.129192352294922, 31.3966121673584, 32.664031982421875, 33.93144989013672, 35.19887161254883, 36.46629333496094, 37.73371124267578]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 7.0, 10.0, 9.0, 24.0, 44.0, 59.0, 69.0, 192.0, 253.0, 525.0, 943.0, 1768.0, 3455.0, 6918.0, 13927.0, 27859.0, 56319.0, 110090.0, 219459.0, 286067.0, 158881.0, 80202.0, 40948.0, 20256.0, 9837.0, 4957.0, 2564.0, 1288.0, 691.0, 408.0, 206.0, 135.0, 68.0, 42.0, 32.0, 17.0, 9.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.265625, -19.74951171875, -19.2333984375, -18.71728515625, -18.201171875, -17.68505859375, -17.1689453125, -16.65283203125, -16.13671875, -15.62060546875, -15.1044921875, -14.58837890625, -14.072265625, -13.55615234375, -13.0400390625, -12.52392578125, -12.0078125, -11.49169921875, -10.9755859375, -10.45947265625, -9.943359375, -9.42724609375, -8.9111328125, -8.39501953125, -7.87890625, -7.36279296875, -6.8466796875, -6.33056640625, -5.814453125, -5.29833984375, -4.7822265625, -4.26611328125, -3.75, -3.23388671875, -2.7177734375, -2.20166015625, -1.685546875, -1.16943359375, -0.6533203125, -0.13720703125, 0.37890625, 0.89501953125, 1.4111328125, 1.92724609375, 2.443359375, 2.95947265625, 3.4755859375, 3.99169921875, 4.5078125, 5.02392578125, 5.5400390625, 6.05615234375, 6.572265625, 7.08837890625, 7.6044921875, 8.12060546875, 8.63671875, 9.15283203125, 9.6689453125, 10.18505859375, 10.701171875, 11.21728515625, 11.7333984375, 12.24951171875, 12.765625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 10.0, 11.0, 12.0, 13.0, 10.0, 18.0, 14.0, 28.0, 24.0, 23.0, 31.0, 32.0, 36.0, 29.0, 31.0, 32.0, 49.0, 56.0, 41.0, 52.0, 49.0, 38.0, 43.0, 47.0, 44.0, 33.0, 29.0, 20.0, 23.0, 17.0, 13.0, 23.0, 8.0, 10.0, 7.0, 14.0, 11.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.817718505859375, -2.70770263671875, -2.597686767578125, -2.4876708984375, -2.377655029296875, -2.26763916015625, -2.157623291015625, -2.047607421875, -1.937591552734375, -1.82757568359375, -1.717559814453125, -1.6075439453125, -1.497528076171875, -1.38751220703125, -1.277496337890625, -1.16748046875, -1.057464599609375, -0.94744873046875, -0.837432861328125, -0.7274169921875, -0.617401123046875, -0.50738525390625, -0.397369384765625, -0.287353515625, -0.177337646484375, -0.06732177734375, 0.042694091796875, 0.1527099609375, 0.262725830078125, 0.37274169921875, 0.482757568359375, 0.5927734375, 0.702789306640625, 0.81280517578125, 0.922821044921875, 1.0328369140625, 1.142852783203125, 1.25286865234375, 1.362884521484375, 1.472900390625, 1.582916259765625, 1.69293212890625, 1.802947998046875, 1.9129638671875, 2.022979736328125, 2.13299560546875, 2.243011474609375, 2.35302734375, 2.463043212890625, 2.57305908203125, 2.683074951171875, 2.7930908203125, 2.903106689453125, 3.01312255859375, 3.123138427734375, 3.233154296875, 3.343170166015625, 3.45318603515625, 3.563201904296875, 3.6732177734375, 3.783233642578125, 3.89324951171875, 4.003265380859375, 4.11328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 10.0, 11.0, 13.0, 13.0, 25.0, 44.0, 38.0, 62.0, 73.0, 122.0, 158.0, 252.0, 340.0, 546.0, 973.0, 1995.0, 4598.0, 11510.0, 33709.0, 99698.0, 307232.0, 387146.0, 129684.0, 44190.0, 15013.0, 5690.0, 2367.0, 1125.0, 645.0, 386.0, 256.0, 172.0, 135.0, 93.0, 47.0, 49.0, 39.0, 17.0, 17.0, 21.0, 9.0, 10.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.015625, -17.375, -16.734375, -16.09375, -15.453125, -14.8125, -14.171875, -13.53125, -12.890625, -12.25, -11.609375, -10.96875, -10.328125, -9.6875, -9.046875, -8.40625, -7.765625, -7.125, -6.484375, -5.84375, -5.203125, -4.5625, -3.921875, -3.28125, -2.640625, -2.0, -1.359375, -0.71875, -0.078125, 0.5625, 1.203125, 1.84375, 2.484375, 3.125, 3.765625, 4.40625, 5.046875, 5.6875, 6.328125, 6.96875, 7.609375, 8.25, 8.890625, 9.53125, 10.171875, 10.8125, 11.453125, 12.09375, 12.734375, 13.375, 14.015625, 14.65625, 15.296875, 15.9375, 16.578125, 17.21875, 17.859375, 18.5, 19.140625, 19.78125, 20.421875, 21.0625, 21.703125, 22.34375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 11.0, 10.0, 8.0, 14.0, 14.0, 19.0, 21.0, 34.0, 31.0, 22.0, 43.0, 47.0, 43.0, 49.0, 53.0, 58.0, 44.0, 52.0, 52.0, 58.0, 44.0, 36.0, 42.0, 38.0, 28.0, 25.0, 23.0, 16.0, 14.0, 10.0, 10.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0], "bins": [-23.765625, -23.1746826171875, -22.583740234375, -21.9927978515625, -21.40185546875, -20.8109130859375, -20.219970703125, -19.6290283203125, -19.0380859375, -18.4471435546875, -17.856201171875, -17.2652587890625, -16.67431640625, -16.0833740234375, -15.492431640625, -14.9014892578125, -14.310546875, -13.7196044921875, -13.128662109375, -12.5377197265625, -11.94677734375, -11.3558349609375, -10.764892578125, -10.1739501953125, -9.5830078125, -8.9920654296875, -8.401123046875, -7.8101806640625, -7.21923828125, -6.6282958984375, -6.037353515625, -5.4464111328125, -4.85546875, -4.2645263671875, -3.673583984375, -3.0826416015625, -2.49169921875, -1.9007568359375, -1.309814453125, -0.7188720703125, -0.1279296875, 0.4630126953125, 1.053955078125, 1.6448974609375, 2.23583984375, 2.8267822265625, 3.417724609375, 4.0086669921875, 4.599609375, 5.1905517578125, 5.781494140625, 6.3724365234375, 6.96337890625, 7.5543212890625, 8.145263671875, 8.7362060546875, 9.3271484375, 9.9180908203125, 10.509033203125, 11.0999755859375, 11.69091796875, 12.2818603515625, 12.872802734375, 13.4637451171875, 14.0546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 15.0, 12.0, 36.0, 49.0, 77.0, 114.0, 229.0, 466.0, 1049.0, 2864.0, 8508.0, 30912.0, 136170.0, 623329.0, 188316.0, 39952.0, 10720.0, 3323.0, 1287.0, 497.0, 255.0, 133.0, 76.0, 47.0, 40.0, 18.0, 20.0, 5.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.626708984375, -21.01904296875, -20.411376953125, -19.8037109375, -19.196044921875, -18.58837890625, -17.980712890625, -17.373046875, -16.765380859375, -16.15771484375, -15.550048828125, -14.9423828125, -14.334716796875, -13.72705078125, -13.119384765625, -12.51171875, -11.904052734375, -11.29638671875, -10.688720703125, -10.0810546875, -9.473388671875, -8.86572265625, -8.258056640625, -7.650390625, -7.042724609375, -6.43505859375, -5.827392578125, -5.2197265625, -4.612060546875, -4.00439453125, -3.396728515625, -2.7890625, -2.181396484375, -1.57373046875, -0.966064453125, -0.3583984375, 0.249267578125, 0.85693359375, 1.464599609375, 2.072265625, 2.679931640625, 3.28759765625, 3.895263671875, 4.5029296875, 5.110595703125, 5.71826171875, 6.325927734375, 6.93359375, 7.541259765625, 8.14892578125, 8.756591796875, 9.3642578125, 9.971923828125, 10.57958984375, 11.187255859375, 11.794921875, 12.402587890625, 13.01025390625, 13.617919921875, 14.2255859375, 14.833251953125, 15.44091796875, 16.048583984375, 16.65625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 14.0, 18.0, 26.0, 23.0, 39.0, 52.0, 106.0, 233.0, 219.0, 91.0, 50.0, 31.0, 24.0, 18.0, 9.0, 14.0, 5.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0059356689453125, -0.0057656168937683105, -0.005595564842224121, -0.005425512790679932, -0.005255460739135742, -0.005085408687591553, -0.004915356636047363, -0.004745304584503174, -0.004575252532958984, -0.004405200481414795, -0.0042351484298706055, -0.004065096378326416, -0.0038950443267822266, -0.003724992275238037, -0.0035549402236938477, -0.003384888172149658, -0.0032148361206054688, -0.0030447840690612793, -0.00287473201751709, -0.0027046799659729004, -0.002534627914428711, -0.0023645758628845215, -0.002194523811340332, -0.0020244717597961426, -0.0018544197082519531, -0.0016843676567077637, -0.0015143156051635742, -0.0013442635536193848, -0.0011742115020751953, -0.0010041594505310059, -0.0008341073989868164, -0.000664055347442627, -0.0004940032958984375, -0.00032395124435424805, -0.0001538991928100586, 1.615285873413086e-05, 0.0001862049102783203, 0.00035625696182250977, 0.0005263090133666992, 0.0006963610649108887, 0.0008664131164550781, 0.0010364651679992676, 0.001206517219543457, 0.0013765692710876465, 0.001546621322631836, 0.0017166733741760254, 0.0018867254257202148, 0.0020567774772644043, 0.0022268295288085938, 0.002396881580352783, 0.0025669336318969727, 0.002736985683441162, 0.0029070377349853516, 0.003077089786529541, 0.0032471418380737305, 0.00341719388961792, 0.0035872459411621094, 0.003757297992706299, 0.003927350044250488, 0.004097402095794678, 0.004267454147338867, 0.004437506198883057, 0.004607558250427246, 0.0047776103019714355, 0.004947662353515625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 6.0, 7.0, 8.0, 14.0, 30.0, 45.0, 50.0, 137.0, 203.0, 522.0, 1410.0, 5865.0, 34327.0, 452348.0, 507606.0, 37182.0, 6164.0, 1525.0, 527.0, 243.0, 126.0, 85.0, 34.0, 33.0, 16.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.242919921875, -22.31396484375, -21.385009765625, -20.4560546875, -19.527099609375, -18.59814453125, -17.669189453125, -16.740234375, -15.811279296875, -14.88232421875, -13.953369140625, -13.0244140625, -12.095458984375, -11.16650390625, -10.237548828125, -9.30859375, -8.379638671875, -7.45068359375, -6.521728515625, -5.5927734375, -4.663818359375, -3.73486328125, -2.805908203125, -1.876953125, -0.947998046875, -0.01904296875, 0.909912109375, 1.8388671875, 2.767822265625, 3.69677734375, 4.625732421875, 5.5546875, 6.483642578125, 7.41259765625, 8.341552734375, 9.2705078125, 10.199462890625, 11.12841796875, 12.057373046875, 12.986328125, 13.915283203125, 14.84423828125, 15.773193359375, 16.7021484375, 17.631103515625, 18.56005859375, 19.489013671875, 20.41796875, 21.346923828125, 22.27587890625, 23.204833984375, 24.1337890625, 25.062744140625, 25.99169921875, 26.920654296875, 27.849609375, 28.778564453125, 29.70751953125, 30.636474609375, 31.5654296875, 32.494384765625, 33.42333984375, 34.352294921875, 35.28125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 13.0, 10.0, 24.0, 21.0, 45.0, 70.0, 105.0, 154.0, 155.0, 132.0, 84.0, 57.0, 41.0, 21.0, 18.0, 16.0, 12.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.34375, -12.79443359375, -12.2451171875, -11.69580078125, -11.146484375, -10.59716796875, -10.0478515625, -9.49853515625, -8.94921875, -8.39990234375, -7.8505859375, -7.30126953125, -6.751953125, -6.20263671875, -5.6533203125, -5.10400390625, -4.5546875, -4.00537109375, -3.4560546875, -2.90673828125, -2.357421875, -1.80810546875, -1.2587890625, -0.70947265625, -0.16015625, 0.38916015625, 0.9384765625, 1.48779296875, 2.037109375, 2.58642578125, 3.1357421875, 3.68505859375, 4.234375, 4.78369140625, 5.3330078125, 5.88232421875, 6.431640625, 6.98095703125, 7.5302734375, 8.07958984375, 8.62890625, 9.17822265625, 9.7275390625, 10.27685546875, 10.826171875, 11.37548828125, 11.9248046875, 12.47412109375, 13.0234375, 13.57275390625, 14.1220703125, 14.67138671875, 15.220703125, 15.77001953125, 16.3193359375, 16.86865234375, 17.41796875, 17.96728515625, 18.5166015625, 19.06591796875, 19.615234375, 20.16455078125, 20.7138671875, 21.26318359375, 21.8125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 12.0, 34.0, 59.0, 118.0, 171.0, 194.0, 197.0, 108.0, 52.0, 30.0, 15.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.4147491455078, -151.77200317382812, -143.1292724609375, -134.4865264892578, -125.84378051757812, -117.20103454589844, -108.55829620361328, -99.91555786132812, -91.27281188964844, -82.63006591796875, -73.9873275756836, -65.34458923339844, -56.70184326171875, -48.05910110473633, -39.416358947753906, -30.773616790771484, -22.130874633789062, -13.48813247680664, -4.845390319824219, 3.797351837158203, 12.440093994140625, 21.082836151123047, 29.72557830810547, 38.36832046508789, 47.01106262207031, 55.653804779052734, 64.29654693603516, 72.93928527832031, 81.58203125, 90.22477722167969, 98.86751556396484, 107.51025390625, 116.15301513671875, 124.79576110839844, 133.43850708007812, 142.08123779296875, 150.72398376464844, 159.36672973632812, 168.00946044921875, 176.65220642089844, 185.29495239257812, 193.9376983642578, 202.5804443359375, 211.22317504882812, 219.8659210205078, 228.5086669921875, 237.15139770507812, 245.7941436767578, 254.4368896484375, 263.0796203613281, 271.7223815917969, 280.3651123046875, 289.00787353515625, 297.6506042480469, 306.2933349609375, 314.93609619140625, 323.5788269042969, 332.2215576171875, 340.86431884765625, 349.5070495605469, 358.1497802734375, 366.79254150390625, 375.4352722167969, 384.0780334472656, 392.72076416015625]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 1.0, 3.0, 4.0, 4.0, 11.0, 8.0, 10.0, 11.0, 20.0, 26.0, 12.0, 21.0, 25.0, 22.0, 26.0, 24.0, 32.0, 30.0, 46.0, 42.0, 45.0, 37.0, 41.0, 50.0, 39.0, 37.0, 42.0, 29.0, 35.0, 40.0, 36.0, 19.0, 15.0, 24.0, 22.0, 27.0, 13.0, 15.0, 9.0, 9.0, 7.0, 4.0, 5.0, 5.0, 3.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.94683837890625, -73.39485168457031, -70.8428726196289, -68.29088592529297, -65.73890686035156, -63.186920166015625, -60.63493728637695, -58.08295440673828, -55.53097152709961, -52.97898864746094, -50.427005767822266, -47.875022888183594, -45.323036193847656, -42.77105712890625, -40.21907043457031, -37.66708755493164, -35.11510467529297, -32.5631217956543, -30.011138916015625, -27.45915412902832, -24.90717124938965, -22.355188369750977, -19.803203582763672, -17.251220703125, -14.699237823486328, -12.147254943847656, -9.595271110534668, -7.043287754058838, -4.491304397583008, -1.939321517944336, 0.6126623153686523, 3.1646461486816406, 5.7166290283203125, 8.268611907958984, 10.820595741271973, 13.372579574584961, 15.924562454223633, 18.476545333862305, 21.02853012084961, 23.58051300048828, 26.132495880126953, 28.684478759765625, 31.236461639404297, 33.78844451904297, 36.340431213378906, 38.89241027832031, 41.44439697265625, 43.99637985229492, 46.548362731933594, 49.100345611572266, 51.65232849121094, 54.20431137084961, 56.75629425048828, 59.30828094482422, 61.86026382446289, 64.41224670410156, 66.9642333984375, 69.51622009277344, 72.06819915771484, 74.62018585205078, 77.17216491699219, 79.72415161132812, 82.27613067626953, 84.82811737060547, 87.38009643554688]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 8.0, 15.0, 15.0, 22.0, 30.0, 61.0, 62.0, 137.0, 180.0, 314.0, 544.0, 795.0, 1361.0, 2363.0, 4038.0, 7314.0, 13725.0, 27591.0, 61578.0, 166338.0, 774907.0, 2655437.0, 300690.0, 95155.0, 40138.0, 19116.0, 9738.0, 5379.0, 2974.0, 1671.0, 977.0, 558.0, 383.0, 239.0, 132.0, 92.0, 69.0, 37.0, 39.0, 12.0, 15.0, 11.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.25, -15.745849609375, -15.24169921875, -14.737548828125, -14.2333984375, -13.729248046875, -13.22509765625, -12.720947265625, -12.216796875, -11.712646484375, -11.20849609375, -10.704345703125, -10.2001953125, -9.696044921875, -9.19189453125, -8.687744140625, -8.18359375, -7.679443359375, -7.17529296875, -6.671142578125, -6.1669921875, -5.662841796875, -5.15869140625, -4.654541015625, -4.150390625, -3.646240234375, -3.14208984375, -2.637939453125, -2.1337890625, -1.629638671875, -1.12548828125, -0.621337890625, -0.1171875, 0.386962890625, 0.89111328125, 1.395263671875, 1.8994140625, 2.403564453125, 2.90771484375, 3.411865234375, 3.916015625, 4.420166015625, 4.92431640625, 5.428466796875, 5.9326171875, 6.436767578125, 6.94091796875, 7.445068359375, 7.94921875, 8.453369140625, 8.95751953125, 9.461669921875, 9.9658203125, 10.469970703125, 10.97412109375, 11.478271484375, 11.982421875, 12.486572265625, 12.99072265625, 13.494873046875, 13.9990234375, 14.503173828125, 15.00732421875, 15.511474609375, 16.015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 10.0, 7.0, 13.0, 5.0, 17.0, 23.0, 19.0, 24.0, 39.0, 23.0, 32.0, 45.0, 49.0, 35.0, 49.0, 70.0, 58.0, 60.0, 48.0, 49.0, 54.0, 32.0, 49.0, 25.0, 33.0, 25.0, 23.0, 15.0, 20.0, 11.0, 7.0, 14.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.04327392578125, -3.9107666015625, -3.77825927734375, -3.645751953125, -3.51324462890625, -3.3807373046875, -3.24822998046875, -3.11572265625, -2.98321533203125, -2.8507080078125, -2.71820068359375, -2.585693359375, -2.45318603515625, -2.3206787109375, -2.18817138671875, -2.0556640625, -1.92315673828125, -1.7906494140625, -1.65814208984375, -1.525634765625, -1.39312744140625, -1.2606201171875, -1.12811279296875, -0.99560546875, -0.86309814453125, -0.7305908203125, -0.59808349609375, -0.465576171875, -0.33306884765625, -0.2005615234375, -0.06805419921875, 0.064453125, 0.19696044921875, 0.3294677734375, 0.46197509765625, 0.594482421875, 0.72698974609375, 0.8594970703125, 0.99200439453125, 1.12451171875, 1.25701904296875, 1.3895263671875, 1.52203369140625, 1.654541015625, 1.78704833984375, 1.9195556640625, 2.05206298828125, 2.1845703125, 2.31707763671875, 2.4495849609375, 2.58209228515625, 2.714599609375, 2.84710693359375, 2.9796142578125, 3.11212158203125, 3.24462890625, 3.37713623046875, 3.5096435546875, 3.64215087890625, 3.774658203125, 3.90716552734375, 4.0396728515625, 4.17218017578125, 4.3046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 15.0, 14.0, 22.0, 42.0, 64.0, 76.0, 137.0, 179.0, 266.0, 453.0, 705.0, 1132.0, 1880.0, 3210.0, 5650.0, 10135.0, 18837.0, 36896.0, 77884.0, 186566.0, 610545.0, 2349790.0, 560687.0, 176864.0, 74442.0, 35657.0, 18554.0, 9950.0, 5586.0, 3116.0, 1839.0, 1121.0, 643.0, 436.0, 293.0, 187.0, 128.0, 88.0, 59.0, 41.0, 28.0, 12.0, 11.0, 8.0, 4.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.890625, -14.41748046875, -13.9443359375, -13.47119140625, -12.998046875, -12.52490234375, -12.0517578125, -11.57861328125, -11.10546875, -10.63232421875, -10.1591796875, -9.68603515625, -9.212890625, -8.73974609375, -8.2666015625, -7.79345703125, -7.3203125, -6.84716796875, -6.3740234375, -5.90087890625, -5.427734375, -4.95458984375, -4.4814453125, -4.00830078125, -3.53515625, -3.06201171875, -2.5888671875, -2.11572265625, -1.642578125, -1.16943359375, -0.6962890625, -0.22314453125, 0.25, 0.72314453125, 1.1962890625, 1.66943359375, 2.142578125, 2.61572265625, 3.0888671875, 3.56201171875, 4.03515625, 4.50830078125, 4.9814453125, 5.45458984375, 5.927734375, 6.40087890625, 6.8740234375, 7.34716796875, 7.8203125, 8.29345703125, 8.7666015625, 9.23974609375, 9.712890625, 10.18603515625, 10.6591796875, 11.13232421875, 11.60546875, 12.07861328125, 12.5517578125, 13.02490234375, 13.498046875, 13.97119140625, 14.4443359375, 14.91748046875, 15.390625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 8.0, 15.0, 20.0, 21.0, 31.0, 36.0, 37.0, 45.0, 65.0, 81.0, 146.0, 217.0, 333.0, 640.0, 935.0, 490.0, 273.0, 169.0, 109.0, 94.0, 64.0, 46.0, 56.0, 29.0, 29.0, 11.0, 11.0, 15.0, 9.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6796875, -8.3729248046875, -8.066162109375, -7.7593994140625, -7.45263671875, -7.1458740234375, -6.839111328125, -6.5323486328125, -6.2255859375, -5.9188232421875, -5.612060546875, -5.3052978515625, -4.99853515625, -4.6917724609375, -4.385009765625, -4.0782470703125, -3.771484375, -3.4647216796875, -3.157958984375, -2.8511962890625, -2.54443359375, -2.2376708984375, -1.930908203125, -1.6241455078125, -1.3173828125, -1.0106201171875, -0.703857421875, -0.3970947265625, -0.09033203125, 0.2164306640625, 0.523193359375, 0.8299560546875, 1.13671875, 1.4434814453125, 1.750244140625, 2.0570068359375, 2.36376953125, 2.6705322265625, 2.977294921875, 3.2840576171875, 3.5908203125, 3.8975830078125, 4.204345703125, 4.5111083984375, 4.81787109375, 5.1246337890625, 5.431396484375, 5.7381591796875, 6.044921875, 6.3516845703125, 6.658447265625, 6.9652099609375, 7.27197265625, 7.5787353515625, 7.885498046875, 8.1922607421875, 8.4990234375, 8.8057861328125, 9.112548828125, 9.4193115234375, 9.72607421875, 10.0328369140625, 10.339599609375, 10.6463623046875, 10.953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 9.0, 24.0, 55.0, 76.0, 143.0, 163.0, 162.0, 121.0, 103.0, 61.0, 45.0, 14.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-138.03591918945312, -134.3201904296875, -130.60447692871094, -126.88874816894531, -123.17302703857422, -119.4572982788086, -115.7415771484375, -112.02584838867188, -108.31012725830078, -104.59440612792969, -100.87867736816406, -97.16295623779297, -93.44723510742188, -89.73150634765625, -86.01578521728516, -82.30006408691406, -78.58433532714844, -74.86861419677734, -71.15288543701172, -67.43716430664062, -63.721439361572266, -60.005714416503906, -56.28999328613281, -52.57426834106445, -48.858551025390625, -45.142826080322266, -41.42710494995117, -37.71138000488281, -33.99565505981445, -30.279932022094727, -26.564208984375, -22.84848403930664, -19.13275909423828, -15.417035102844238, -11.701311111450195, -7.985588073730469, -4.269864082336426, -0.5541400909423828, 3.1615829467773438, 6.877307891845703, 10.59303092956543, 14.308754920959473, 18.024478912353516, 21.740201950073242, 25.45592498779297, 29.171649932861328, 32.88737487792969, 36.60309600830078, 40.31882095336914, 44.0345458984375, 47.750267028808594, 51.46599197387695, 55.18171691894531, 58.897438049316406, 62.613162994384766, 66.32888793945312, 70.04460906982422, 73.76033020019531, 77.47605895996094, 81.19178009033203, 84.90750122070312, 88.62322998046875, 92.33895111083984, 96.05467224121094, 99.77040100097656]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 8.0, 14.0, 12.0, 15.0, 12.0, 17.0, 15.0, 34.0, 36.0, 24.0, 32.0, 30.0, 52.0, 39.0, 44.0, 34.0, 53.0, 50.0, 39.0, 41.0, 45.0, 30.0, 35.0, 33.0, 36.0, 26.0, 34.0, 27.0, 18.0, 16.0, 10.0, 10.0, 8.0, 7.0, 9.0, 5.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0], "bins": [-47.174259185791016, -45.86351776123047, -44.55277633666992, -43.242034912109375, -41.93129348754883, -40.62055206298828, -39.309810638427734, -37.99906921386719, -36.688323974609375, -35.37758255004883, -34.06684112548828, -32.756099700927734, -31.445358276367188, -30.13461685180664, -28.82387351989746, -27.513132095336914, -26.202392578125, -24.891651153564453, -23.580909729003906, -22.27016830444336, -20.959426879882812, -19.648685455322266, -18.337942123413086, -17.02720069885254, -15.716459274291992, -14.405717849731445, -13.094976425170898, -11.784234046936035, -10.473492622375488, -9.162751197814941, -7.852009296417236, -6.541267395019531, -5.230522155761719, -3.9197804927825928, -2.609038829803467, -1.2982971668243408, 0.012444496154785156, 1.323185920715332, 2.633927822113037, 3.944669723510742, 5.255411148071289, 6.566152572631836, 7.876894474029541, 9.187636375427246, 10.498377799987793, 11.80911922454834, 13.119861602783203, 14.43060302734375, 15.741344451904297, 17.052085876464844, 18.36282730102539, 19.673568725585938, 20.984310150146484, 22.29505157470703, 23.60579490661621, 24.916536331176758, 26.227277755737305, 27.53801918029785, 28.8487606048584, 30.159502029418945, 31.470245361328125, 32.78098678588867, 34.09172821044922, 35.402469635009766, 36.71321105957031]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 8.0, 5.0, 13.0, 26.0, 43.0, 49.0, 83.0, 144.0, 244.0, 406.0, 801.0, 1569.0, 3042.0, 6282.0, 13748.0, 31227.0, 75862.0, 259002.0, 457703.0, 116755.0, 44897.0, 19344.0, 8702.0, 4129.0, 2067.0, 1060.0, 591.0, 296.0, 208.0, 85.0, 57.0, 35.0, 26.0, 14.0, 6.0, 9.0, 10.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.803466796875, -20.09130859375, -19.379150390625, -18.6669921875, -17.954833984375, -17.24267578125, -16.530517578125, -15.818359375, -15.106201171875, -14.39404296875, -13.681884765625, -12.9697265625, -12.257568359375, -11.54541015625, -10.833251953125, -10.12109375, -9.408935546875, -8.69677734375, -7.984619140625, -7.2724609375, -6.560302734375, -5.84814453125, -5.135986328125, -4.423828125, -3.711669921875, -2.99951171875, -2.287353515625, -1.5751953125, -0.863037109375, -0.15087890625, 0.561279296875, 1.2734375, 1.985595703125, 2.69775390625, 3.409912109375, 4.1220703125, 4.834228515625, 5.54638671875, 6.258544921875, 6.970703125, 7.682861328125, 8.39501953125, 9.107177734375, 9.8193359375, 10.531494140625, 11.24365234375, 11.955810546875, 12.66796875, 13.380126953125, 14.09228515625, 14.804443359375, 15.5166015625, 16.228759765625, 16.94091796875, 17.653076171875, 18.365234375, 19.077392578125, 19.78955078125, 20.501708984375, 21.2138671875, 21.926025390625, 22.63818359375, 23.350341796875, 24.0625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 8.0, 14.0, 10.0, 11.0, 17.0, 24.0, 20.0, 30.0, 27.0, 27.0, 21.0, 41.0, 40.0, 58.0, 54.0, 68.0, 44.0, 50.0, 53.0, 56.0, 51.0, 37.0, 34.0, 32.0, 19.0, 30.0, 19.0, 20.0, 21.0, 21.0, 14.0, 7.0, 8.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9765625, -3.8427734375, -3.708984375, -3.5751953125, -3.44140625, -3.3076171875, -3.173828125, -3.0400390625, -2.90625, -2.7724609375, -2.638671875, -2.5048828125, -2.37109375, -2.2373046875, -2.103515625, -1.9697265625, -1.8359375, -1.7021484375, -1.568359375, -1.4345703125, -1.30078125, -1.1669921875, -1.033203125, -0.8994140625, -0.765625, -0.6318359375, -0.498046875, -0.3642578125, -0.23046875, -0.0966796875, 0.037109375, 0.1708984375, 0.3046875, 0.4384765625, 0.572265625, 0.7060546875, 0.83984375, 0.9736328125, 1.107421875, 1.2412109375, 1.375, 1.5087890625, 1.642578125, 1.7763671875, 1.91015625, 2.0439453125, 2.177734375, 2.3115234375, 2.4453125, 2.5791015625, 2.712890625, 2.8466796875, 2.98046875, 3.1142578125, 3.248046875, 3.3818359375, 3.515625, 3.6494140625, 3.783203125, 3.9169921875, 4.05078125, 4.1845703125, 4.318359375, 4.4521484375, 4.5859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 6.0, 11.0, 15.0, 25.0, 22.0, 43.0, 51.0, 74.0, 104.0, 147.0, 225.0, 403.0, 617.0, 1130.0, 2324.0, 5357.0, 15002.0, 54229.0, 283194.0, 555263.0, 92663.0, 23401.0, 7473.0, 3086.0, 1470.0, 831.0, 481.0, 261.0, 192.0, 141.0, 74.0, 65.0, 43.0, 41.0, 14.0, 19.0, 14.0, 9.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-28.21875, -27.393310546875, -26.56787109375, -25.742431640625, -24.9169921875, -24.091552734375, -23.26611328125, -22.440673828125, -21.615234375, -20.789794921875, -19.96435546875, -19.138916015625, -18.3134765625, -17.488037109375, -16.66259765625, -15.837158203125, -15.01171875, -14.186279296875, -13.36083984375, -12.535400390625, -11.7099609375, -10.884521484375, -10.05908203125, -9.233642578125, -8.408203125, -7.582763671875, -6.75732421875, -5.931884765625, -5.1064453125, -4.281005859375, -3.45556640625, -2.630126953125, -1.8046875, -0.979248046875, -0.15380859375, 0.671630859375, 1.4970703125, 2.322509765625, 3.14794921875, 3.973388671875, 4.798828125, 5.624267578125, 6.44970703125, 7.275146484375, 8.1005859375, 8.926025390625, 9.75146484375, 10.576904296875, 11.40234375, 12.227783203125, 13.05322265625, 13.878662109375, 14.7041015625, 15.529541015625, 16.35498046875, 17.180419921875, 18.005859375, 18.831298828125, 19.65673828125, 20.482177734375, 21.3076171875, 22.133056640625, 22.95849609375, 23.783935546875, 24.609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 7.0, 11.0, 10.0, 11.0, 13.0, 16.0, 23.0, 21.0, 27.0, 37.0, 50.0, 48.0, 46.0, 48.0, 64.0, 49.0, 53.0, 49.0, 43.0, 32.0, 54.0, 40.0, 37.0, 21.0, 35.0, 28.0, 25.0, 14.0, 17.0, 13.0, 10.0, 7.0, 11.0, 9.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.125, -16.51953125, -15.9140625, -15.30859375, -14.703125, -14.09765625, -13.4921875, -12.88671875, -12.28125, -11.67578125, -11.0703125, -10.46484375, -9.859375, -9.25390625, -8.6484375, -8.04296875, -7.4375, -6.83203125, -6.2265625, -5.62109375, -5.015625, -4.41015625, -3.8046875, -3.19921875, -2.59375, -1.98828125, -1.3828125, -0.77734375, -0.171875, 0.43359375, 1.0390625, 1.64453125, 2.25, 2.85546875, 3.4609375, 4.06640625, 4.671875, 5.27734375, 5.8828125, 6.48828125, 7.09375, 7.69921875, 8.3046875, 8.91015625, 9.515625, 10.12109375, 10.7265625, 11.33203125, 11.9375, 12.54296875, 13.1484375, 13.75390625, 14.359375, 14.96484375, 15.5703125, 16.17578125, 16.78125, 17.38671875, 17.9921875, 18.59765625, 19.203125, 19.80859375, 20.4140625, 21.01953125, 21.625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 7.0, 13.0, 15.0, 22.0, 46.0, 88.0, 134.0, 283.0, 611.0, 1678.0, 5287.0, 24602.0, 332029.0, 639034.0, 34611.0, 6619.0, 1994.0, 701.0, 347.0, 163.0, 103.0, 65.0, 27.0, 21.0, 13.0, 11.0, 6.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.4375, -32.427001953125, -31.41650390625, -30.406005859375, -29.3955078125, -28.385009765625, -27.37451171875, -26.364013671875, -25.353515625, -24.343017578125, -23.33251953125, -22.322021484375, -21.3115234375, -20.301025390625, -19.29052734375, -18.280029296875, -17.26953125, -16.259033203125, -15.24853515625, -14.238037109375, -13.2275390625, -12.217041015625, -11.20654296875, -10.196044921875, -9.185546875, -8.175048828125, -7.16455078125, -6.154052734375, -5.1435546875, -4.133056640625, -3.12255859375, -2.112060546875, -1.1015625, -0.091064453125, 0.91943359375, 1.929931640625, 2.9404296875, 3.950927734375, 4.96142578125, 5.971923828125, 6.982421875, 7.992919921875, 9.00341796875, 10.013916015625, 11.0244140625, 12.034912109375, 13.04541015625, 14.055908203125, 15.06640625, 16.076904296875, 17.08740234375, 18.097900390625, 19.1083984375, 20.118896484375, 21.12939453125, 22.139892578125, 23.150390625, 24.160888671875, 25.17138671875, 26.181884765625, 27.1923828125, 28.202880859375, 29.21337890625, 30.223876953125, 31.234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 4.0, 11.0, 8.0, 8.0, 17.0, 22.0, 38.0, 41.0, 70.0, 190.0, 246.0, 111.0, 62.0, 32.0, 32.0, 18.0, 16.0, 16.0, 8.0, 6.0, 7.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00412750244140625, -0.00398629903793335, -0.0038450956344604492, -0.003703892230987549, -0.0035626888275146484, -0.003421485424041748, -0.0032802820205688477, -0.0031390786170959473, -0.002997875213623047, -0.0028566718101501465, -0.002715468406677246, -0.0025742650032043457, -0.0024330615997314453, -0.002291858196258545, -0.0021506547927856445, -0.002009451389312744, -0.0018682479858398438, -0.0017270445823669434, -0.001585841178894043, -0.0014446377754211426, -0.0013034343719482422, -0.0011622309684753418, -0.0010210275650024414, -0.000879824161529541, -0.0007386207580566406, -0.0005974173545837402, -0.00045621395111083984, -0.00031501054763793945, -0.00017380714416503906, -3.260374069213867e-05, 0.00010859966278076172, 0.0002498030662536621, 0.0003910064697265625, 0.0005322098731994629, 0.0006734132766723633, 0.0008146166801452637, 0.0009558200836181641, 0.0010970234870910645, 0.0012382268905639648, 0.0013794302940368652, 0.0015206336975097656, 0.001661837100982666, 0.0018030405044555664, 0.0019442439079284668, 0.002085447311401367, 0.0022266507148742676, 0.002367854118347168, 0.0025090575218200684, 0.0026502609252929688, 0.002791464328765869, 0.0029326677322387695, 0.00307387113571167, 0.0032150745391845703, 0.0033562779426574707, 0.003497481346130371, 0.0036386847496032715, 0.003779888153076172, 0.003921091556549072, 0.004062294960021973, 0.004203498363494873, 0.0043447017669677734, 0.004485905170440674, 0.004627108573913574, 0.004768311977386475, 0.004909515380859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 3.0, 9.0, 4.0, 20.0, 20.0, 31.0, 42.0, 92.0, 116.0, 211.0, 370.0, 755.0, 1571.0, 4161.0, 12467.0, 53044.0, 626115.0, 298643.0, 35667.0, 9144.0, 3178.0, 1371.0, 693.0, 341.0, 191.0, 94.0, 67.0, 45.0, 25.0, 20.0, 10.0, 6.0, 6.0, 3.0, 12.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.46875, -22.7548828125, -22.041015625, -21.3271484375, -20.61328125, -19.8994140625, -19.185546875, -18.4716796875, -17.7578125, -17.0439453125, -16.330078125, -15.6162109375, -14.90234375, -14.1884765625, -13.474609375, -12.7607421875, -12.046875, -11.3330078125, -10.619140625, -9.9052734375, -9.19140625, -8.4775390625, -7.763671875, -7.0498046875, -6.3359375, -5.6220703125, -4.908203125, -4.1943359375, -3.48046875, -2.7666015625, -2.052734375, -1.3388671875, -0.625, 0.0888671875, 0.802734375, 1.5166015625, 2.23046875, 2.9443359375, 3.658203125, 4.3720703125, 5.0859375, 5.7998046875, 6.513671875, 7.2275390625, 7.94140625, 8.6552734375, 9.369140625, 10.0830078125, 10.796875, 11.5107421875, 12.224609375, 12.9384765625, 13.65234375, 14.3662109375, 15.080078125, 15.7939453125, 16.5078125, 17.2216796875, 17.935546875, 18.6494140625, 19.36328125, 20.0771484375, 20.791015625, 21.5048828125, 22.21875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 7.0, 11.0, 9.0, 9.0, 9.0, 25.0, 34.0, 45.0, 66.0, 139.0, 168.0, 180.0, 110.0, 50.0, 34.0, 24.0, 17.0, 15.0, 13.0, 11.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -13.0809326171875, -12.575927734375, -12.0709228515625, -11.56591796875, -11.0609130859375, -10.555908203125, -10.0509033203125, -9.5458984375, -9.0408935546875, -8.535888671875, -8.0308837890625, -7.52587890625, -7.0208740234375, -6.515869140625, -6.0108642578125, -5.505859375, -5.0008544921875, -4.495849609375, -3.9908447265625, -3.48583984375, -2.9808349609375, -2.475830078125, -1.9708251953125, -1.4658203125, -0.9608154296875, -0.455810546875, 0.0491943359375, 0.55419921875, 1.0592041015625, 1.564208984375, 2.0692138671875, 2.57421875, 3.0792236328125, 3.584228515625, 4.0892333984375, 4.59423828125, 5.0992431640625, 5.604248046875, 6.1092529296875, 6.6142578125, 7.1192626953125, 7.624267578125, 8.1292724609375, 8.63427734375, 9.1392822265625, 9.644287109375, 10.1492919921875, 10.654296875, 11.1593017578125, 11.664306640625, 12.1693115234375, 12.67431640625, 13.1793212890625, 13.684326171875, 14.1893310546875, 14.6943359375, 15.1993408203125, 15.704345703125, 16.2093505859375, 16.71435546875, 17.2193603515625, 17.724365234375, 18.2293701171875, 18.734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 12.0, 28.0, 58.0, 113.0, 164.0, 197.0, 154.0, 111.0, 80.0, 42.0, 14.0, 12.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.37586975097656, -139.50830078125, -130.64073181152344, -121.77316284179688, -112.90559387207031, -104.03802490234375, -95.17045593261719, -86.30288696289062, -77.43531799316406, -68.5677490234375, -59.70018005371094, -50.832611083984375, -41.96504211425781, -33.09747314453125, -24.229904174804688, -15.362335205078125, -6.4947662353515625, 2.372802734375, 11.240371704101562, 20.107940673828125, 28.975509643554688, 37.84307861328125, 46.71064758300781, 55.578216552734375, 64.44578552246094, 73.3133544921875, 82.18092346191406, 91.04849243164062, 99.91606140136719, 108.78363037109375, 117.65119934082031, 126.51876831054688, 135.3863525390625, 144.25392150878906, 153.12149047851562, 161.9890594482422, 170.85662841796875, 179.7241973876953, 188.59176635742188, 197.45933532714844, 206.326904296875, 215.19447326660156, 224.06204223632812, 232.9296112060547, 241.79718017578125, 250.6647491455078, 259.5323181152344, 268.39990234375, 277.2674560546875, 286.135009765625, 295.0025939941406, 303.87017822265625, 312.73773193359375, 321.60528564453125, 330.4728698730469, 339.3404541015625, 348.2080078125, 357.0755615234375, 365.9431457519531, 374.81072998046875, 383.67828369140625, 392.54583740234375, 401.4134216308594, 410.281005859375, 419.1485595703125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 10.0, 10.0, 10.0, 16.0, 10.0, 16.0, 23.0, 23.0, 15.0, 29.0, 29.0, 25.0, 40.0, 32.0, 45.0, 42.0, 40.0, 39.0, 41.0, 39.0, 47.0, 42.0, 44.0, 31.0, 32.0, 38.0, 25.0, 26.0, 22.0, 23.0, 23.0, 20.0, 10.0, 18.0, 14.0, 13.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-80.12784576416016, -77.42349243164062, -74.7191390991211, -72.01478576660156, -69.3104248046875, -66.60607147216797, -63.90171813964844, -61.197364807128906, -58.493011474609375, -55.788658142089844, -53.08430480957031, -50.379947662353516, -47.675594329833984, -44.97124099731445, -42.266883850097656, -39.562530517578125, -36.858177185058594, -34.15382385253906, -31.4494686126709, -28.745113372802734, -26.040760040283203, -23.336406707763672, -20.632051467895508, -17.927696228027344, -15.223342895507812, -12.518988609313965, -9.814634323120117, -7.1102800369262695, -4.405925750732422, -1.7015714645385742, 1.0027828216552734, 3.7071380615234375, 6.4114837646484375, 9.115838050842285, 11.820192337036133, 14.52454662322998, 17.228900909423828, 19.93325424194336, 22.637609481811523, 25.341964721679688, 28.04631805419922, 30.75067138671875, 33.45502471923828, 36.15938186645508, 38.86373519897461, 41.56808853149414, 44.27244567871094, 46.97679901123047, 49.68115234375, 52.38550567626953, 55.08985900878906, 57.79421615600586, 60.49856948852539, 63.20292282104492, 65.90727996826172, 68.61163330078125, 71.31598663330078, 74.02033996582031, 76.72469329833984, 79.42904663085938, 82.13340759277344, 84.83776092529297, 87.5421142578125, 90.24646759033203, 92.95082092285156]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 5.0, 6.0, 21.0, 14.0, 21.0, 28.0, 41.0, 54.0, 83.0, 129.0, 202.0, 322.0, 511.0, 743.0, 1128.0, 2067.0, 3553.0, 6227.0, 11617.0, 24266.0, 57685.0, 178455.0, 1937326.0, 1684657.0, 176242.0, 57371.0, 24472.0, 11876.0, 6275.0, 3510.0, 1991.0, 1267.0, 730.0, 429.0, 335.0, 199.0, 122.0, 85.0, 74.0, 44.0, 29.0, 16.0, 16.0, 17.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.341552734375, -17.72998046875, -17.118408203125, -16.5068359375, -15.895263671875, -15.28369140625, -14.672119140625, -14.060546875, -13.448974609375, -12.83740234375, -12.225830078125, -11.6142578125, -11.002685546875, -10.39111328125, -9.779541015625, -9.16796875, -8.556396484375, -7.94482421875, -7.333251953125, -6.7216796875, -6.110107421875, -5.49853515625, -4.886962890625, -4.275390625, -3.663818359375, -3.05224609375, -2.440673828125, -1.8291015625, -1.217529296875, -0.60595703125, 0.005615234375, 0.6171875, 1.228759765625, 1.84033203125, 2.451904296875, 3.0634765625, 3.675048828125, 4.28662109375, 4.898193359375, 5.509765625, 6.121337890625, 6.73291015625, 7.344482421875, 7.9560546875, 8.567626953125, 9.17919921875, 9.790771484375, 10.40234375, 11.013916015625, 11.62548828125, 12.237060546875, 12.8486328125, 13.460205078125, 14.07177734375, 14.683349609375, 15.294921875, 15.906494140625, 16.51806640625, 17.129638671875, 17.7412109375, 18.352783203125, 18.96435546875, 19.575927734375, 20.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 5.0, 2.0, 12.0, 9.0, 18.0, 18.0, 9.0, 13.0, 15.0, 24.0, 20.0, 27.0, 30.0, 40.0, 26.0, 44.0, 39.0, 48.0, 42.0, 56.0, 53.0, 51.0, 55.0, 26.0, 36.0, 39.0, 38.0, 20.0, 27.0, 34.0, 26.0, 18.0, 18.0, 9.0, 5.0, 10.0, 11.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.01953125, -3.88818359375, -3.7568359375, -3.62548828125, -3.494140625, -3.36279296875, -3.2314453125, -3.10009765625, -2.96875, -2.83740234375, -2.7060546875, -2.57470703125, -2.443359375, -2.31201171875, -2.1806640625, -2.04931640625, -1.91796875, -1.78662109375, -1.6552734375, -1.52392578125, -1.392578125, -1.26123046875, -1.1298828125, -0.99853515625, -0.8671875, -0.73583984375, -0.6044921875, -0.47314453125, -0.341796875, -0.21044921875, -0.0791015625, 0.05224609375, 0.18359375, 0.31494140625, 0.4462890625, 0.57763671875, 0.708984375, 0.84033203125, 0.9716796875, 1.10302734375, 1.234375, 1.36572265625, 1.4970703125, 1.62841796875, 1.759765625, 1.89111328125, 2.0224609375, 2.15380859375, 2.28515625, 2.41650390625, 2.5478515625, 2.67919921875, 2.810546875, 2.94189453125, 3.0732421875, 3.20458984375, 3.3359375, 3.46728515625, 3.5986328125, 3.72998046875, 3.861328125, 3.99267578125, 4.1240234375, 4.25537109375, 4.38671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 9.0, 14.0, 12.0, 24.0, 31.0, 30.0, 67.0, 83.0, 169.0, 209.0, 400.0, 631.0, 1255.0, 2219.0, 4323.0, 9354.0, 23052.0, 74618.0, 412284.0, 3193277.0, 363209.0, 68800.0, 21835.0, 9109.0, 4294.0, 2195.0, 1148.0, 619.0, 366.0, 241.0, 137.0, 102.0, 62.0, 31.0, 26.0, 12.0, 10.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.03125, -27.111328125, -26.19140625, -25.271484375, -24.3515625, -23.431640625, -22.51171875, -21.591796875, -20.671875, -19.751953125, -18.83203125, -17.912109375, -16.9921875, -16.072265625, -15.15234375, -14.232421875, -13.3125, -12.392578125, -11.47265625, -10.552734375, -9.6328125, -8.712890625, -7.79296875, -6.873046875, -5.953125, -5.033203125, -4.11328125, -3.193359375, -2.2734375, -1.353515625, -0.43359375, 0.486328125, 1.40625, 2.326171875, 3.24609375, 4.166015625, 5.0859375, 6.005859375, 6.92578125, 7.845703125, 8.765625, 9.685546875, 10.60546875, 11.525390625, 12.4453125, 13.365234375, 14.28515625, 15.205078125, 16.125, 17.044921875, 17.96484375, 18.884765625, 19.8046875, 20.724609375, 21.64453125, 22.564453125, 23.484375, 24.404296875, 25.32421875, 26.244140625, 27.1640625, 28.083984375, 29.00390625, 29.923828125, 30.84375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 4.0, 4.0, 10.0, 12.0, 20.0, 38.0, 40.0, 64.0, 138.0, 175.0, 383.0, 1023.0, 1182.0, 393.0, 210.0, 117.0, 82.0, 39.0, 27.0, 25.0, 20.0, 9.0, 13.0, 7.0, 10.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -16.0513916015625, -15.618408203125, -15.1854248046875, -14.75244140625, -14.3194580078125, -13.886474609375, -13.4534912109375, -13.0205078125, -12.5875244140625, -12.154541015625, -11.7215576171875, -11.28857421875, -10.8555908203125, -10.422607421875, -9.9896240234375, -9.556640625, -9.1236572265625, -8.690673828125, -8.2576904296875, -7.82470703125, -7.3917236328125, -6.958740234375, -6.5257568359375, -6.0927734375, -5.6597900390625, -5.226806640625, -4.7938232421875, -4.36083984375, -3.9278564453125, -3.494873046875, -3.0618896484375, -2.62890625, -2.1959228515625, -1.762939453125, -1.3299560546875, -0.89697265625, -0.4639892578125, -0.031005859375, 0.4019775390625, 0.8349609375, 1.2679443359375, 1.700927734375, 2.1339111328125, 2.56689453125, 2.9998779296875, 3.432861328125, 3.8658447265625, 4.298828125, 4.7318115234375, 5.164794921875, 5.5977783203125, 6.03076171875, 6.4637451171875, 6.896728515625, 7.3297119140625, 7.7626953125, 8.1956787109375, 8.628662109375, 9.0616455078125, 9.49462890625, 9.9276123046875, 10.360595703125, 10.7935791015625, 11.2265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 10.0, 16.0, 28.0, 46.0, 58.0, 84.0, 96.0, 103.0, 137.0, 102.0, 100.0, 71.0, 57.0, 31.0, 13.0, 14.0, 9.0, 9.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.20120239257812, -71.48805236816406, -68.77489471435547, -66.0617446899414, -63.34859085083008, -60.63543701171875, -57.92228698730469, -55.20913314819336, -52.49597930908203, -49.7828254699707, -47.06967544555664, -44.35652160644531, -41.643367767333984, -38.930213928222656, -36.217063903808594, -33.503910064697266, -30.790760040283203, -28.077608108520508, -25.36445426940918, -22.651302337646484, -19.938148498535156, -17.22499656677246, -14.511844635009766, -11.798690795898438, -9.085538864135742, -6.3723859786987305, -3.659233570098877, -0.9460811614990234, 1.7670717239379883, 4.480224609375, 7.193376541137695, 9.906530380249023, 12.619682312011719, 15.33283519744873, 18.045988082885742, 20.759140014648438, 23.472293853759766, 26.18544578552246, 28.898597717285156, 31.611751556396484, 34.32490539550781, 37.03805923461914, 39.7512092590332, 42.46436309814453, 45.17751693725586, 47.89067077636719, 50.60382080078125, 53.31697463989258, 56.03012466430664, 58.74327850341797, 61.45642852783203, 64.16958618164062, 66.88273620605469, 69.59588623046875, 72.30903625488281, 75.0221939086914, 77.73534393310547, 80.44849395751953, 83.16165161132812, 85.87480163574219, 88.58795166015625, 91.30110931396484, 94.0142593383789, 96.7274169921875, 99.44056701660156]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 10.0, 14.0, 6.0, 14.0, 14.0, 18.0, 22.0, 21.0, 28.0, 38.0, 45.0, 36.0, 40.0, 35.0, 41.0, 46.0, 44.0, 39.0, 42.0, 43.0, 44.0, 41.0, 39.0, 29.0, 29.0, 30.0, 27.0, 23.0, 18.0, 17.0, 13.0, 23.0, 11.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.97904586791992, -39.616050720214844, -38.25305938720703, -36.89006423950195, -35.527069091796875, -34.1640739440918, -32.80107879638672, -31.438087463378906, -30.075092315673828, -28.71209716796875, -27.349103927612305, -25.98611068725586, -24.62311553955078, -23.260120391845703, -21.897127151489258, -20.534133911132812, -19.171138763427734, -17.808143615722656, -16.44515037536621, -15.08215618133545, -13.719161987304688, -12.356167793273926, -10.993173599243164, -9.630179405212402, -8.26718521118164, -6.904191017150879, -5.541196823120117, -4.1782026290893555, -2.8152084350585938, -1.452214241027832, -0.08922004699707031, 1.2737741470336914, 2.636768341064453, 3.999762535095215, 5.362756729125977, 6.725750923156738, 8.0887451171875, 9.451739311218262, 10.814733505249023, 12.177727699279785, 13.540721893310547, 14.903716087341309, 16.26671028137207, 17.629703521728516, 18.992698669433594, 20.355693817138672, 21.718687057495117, 23.081680297851562, 24.44467544555664, 25.80767059326172, 27.170663833618164, 28.53365707397461, 29.896652221679688, 31.259647369384766, 32.622642517089844, 33.985633850097656, 35.348628997802734, 36.71162414550781, 38.074615478515625, 39.4376106262207, 40.80060577392578, 42.16360092163086, 43.52659606933594, 44.88958740234375, 46.25258255004883]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 9.0, 9.0, 13.0, 8.0, 20.0, 20.0, 19.0, 42.0, 54.0, 74.0, 123.0, 212.0, 337.0, 599.0, 1032.0, 1925.0, 3584.0, 6885.0, 13253.0, 26560.0, 56506.0, 177557.0, 480379.0, 170168.0, 55367.0, 25976.0, 13084.0, 6893.0, 3462.0, 1839.0, 1042.0, 587.0, 342.0, 197.0, 114.0, 80.0, 59.0, 34.0, 16.0, 16.0, 21.0, 12.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.59375, -16.01123046875, -15.4287109375, -14.84619140625, -14.263671875, -13.68115234375, -13.0986328125, -12.51611328125, -11.93359375, -11.35107421875, -10.7685546875, -10.18603515625, -9.603515625, -9.02099609375, -8.4384765625, -7.85595703125, -7.2734375, -6.69091796875, -6.1083984375, -5.52587890625, -4.943359375, -4.36083984375, -3.7783203125, -3.19580078125, -2.61328125, -2.03076171875, -1.4482421875, -0.86572265625, -0.283203125, 0.29931640625, 0.8818359375, 1.46435546875, 2.046875, 2.62939453125, 3.2119140625, 3.79443359375, 4.376953125, 4.95947265625, 5.5419921875, 6.12451171875, 6.70703125, 7.28955078125, 7.8720703125, 8.45458984375, 9.037109375, 9.61962890625, 10.2021484375, 10.78466796875, 11.3671875, 11.94970703125, 12.5322265625, 13.11474609375, 13.697265625, 14.27978515625, 14.8623046875, 15.44482421875, 16.02734375, 16.60986328125, 17.1923828125, 17.77490234375, 18.357421875, 18.93994140625, 19.5224609375, 20.10498046875, 20.6875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 6.0, 4.0, 2.0, 9.0, 11.0, 13.0, 15.0, 14.0, 20.0, 14.0, 25.0, 23.0, 33.0, 30.0, 29.0, 32.0, 32.0, 40.0, 52.0, 54.0, 46.0, 50.0, 35.0, 37.0, 38.0, 51.0, 46.0, 34.0, 23.0, 22.0, 22.0, 28.0, 19.0, 19.0, 13.0, 9.0, 15.0, 7.0, 6.0, 7.0, 3.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.078125, -3.93670654296875, -3.7952880859375, -3.65386962890625, -3.512451171875, -3.37103271484375, -3.2296142578125, -3.08819580078125, -2.94677734375, -2.80535888671875, -2.6639404296875, -2.52252197265625, -2.381103515625, -2.23968505859375, -2.0982666015625, -1.95684814453125, -1.8154296875, -1.67401123046875, -1.5325927734375, -1.39117431640625, -1.249755859375, -1.10833740234375, -0.9669189453125, -0.82550048828125, -0.68408203125, -0.54266357421875, -0.4012451171875, -0.25982666015625, -0.118408203125, 0.02301025390625, 0.1644287109375, 0.30584716796875, 0.447265625, 0.58868408203125, 0.7301025390625, 0.87152099609375, 1.012939453125, 1.15435791015625, 1.2957763671875, 1.43719482421875, 1.57861328125, 1.72003173828125, 1.8614501953125, 2.00286865234375, 2.144287109375, 2.28570556640625, 2.4271240234375, 2.56854248046875, 2.7099609375, 2.85137939453125, 2.9927978515625, 3.13421630859375, 3.275634765625, 3.41705322265625, 3.5584716796875, 3.69989013671875, 3.84130859375, 3.98272705078125, 4.1241455078125, 4.26556396484375, 4.406982421875, 4.54840087890625, 4.6898193359375, 4.83123779296875, 4.97265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 11.0, 13.0, 13.0, 20.0, 17.0, 39.0, 50.0, 79.0, 105.0, 203.0, 329.0, 636.0, 1203.0, 2786.0, 6435.0, 15942.0, 42174.0, 225011.0, 644881.0, 67569.0, 23958.0, 9442.0, 4076.0, 1675.0, 829.0, 430.0, 219.0, 128.0, 73.0, 63.0, 33.0, 19.0, 24.0, 11.0, 14.0, 14.0, 9.0, 5.0, 1.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.7060546875, -25.724609375, -24.7431640625, -23.76171875, -22.7802734375, -21.798828125, -20.8173828125, -19.8359375, -18.8544921875, -17.873046875, -16.8916015625, -15.91015625, -14.9287109375, -13.947265625, -12.9658203125, -11.984375, -11.0029296875, -10.021484375, -9.0400390625, -8.05859375, -7.0771484375, -6.095703125, -5.1142578125, -4.1328125, -3.1513671875, -2.169921875, -1.1884765625, -0.20703125, 0.7744140625, 1.755859375, 2.7373046875, 3.71875, 4.7001953125, 5.681640625, 6.6630859375, 7.64453125, 8.6259765625, 9.607421875, 10.5888671875, 11.5703125, 12.5517578125, 13.533203125, 14.5146484375, 15.49609375, 16.4775390625, 17.458984375, 18.4404296875, 19.421875, 20.4033203125, 21.384765625, 22.3662109375, 23.34765625, 24.3291015625, 25.310546875, 26.2919921875, 27.2734375, 28.2548828125, 29.236328125, 30.2177734375, 31.19921875, 32.1806640625, 33.162109375, 34.1435546875, 35.125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 7.0, 7.0, 3.0, 7.0, 16.0, 14.0, 30.0, 37.0, 42.0, 46.0, 54.0, 65.0, 57.0, 67.0, 86.0, 67.0, 70.0, 59.0, 46.0, 47.0, 37.0, 26.0, 18.0, 23.0, 16.0, 10.0, 8.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.21875, -28.2177734375, -27.216796875, -26.2158203125, -25.21484375, -24.2138671875, -23.212890625, -22.2119140625, -21.2109375, -20.2099609375, -19.208984375, -18.2080078125, -17.20703125, -16.2060546875, -15.205078125, -14.2041015625, -13.203125, -12.2021484375, -11.201171875, -10.2001953125, -9.19921875, -8.1982421875, -7.197265625, -6.1962890625, -5.1953125, -4.1943359375, -3.193359375, -2.1923828125, -1.19140625, -0.1904296875, 0.810546875, 1.8115234375, 2.8125, 3.8134765625, 4.814453125, 5.8154296875, 6.81640625, 7.8173828125, 8.818359375, 9.8193359375, 10.8203125, 11.8212890625, 12.822265625, 13.8232421875, 14.82421875, 15.8251953125, 16.826171875, 17.8271484375, 18.828125, 19.8291015625, 20.830078125, 21.8310546875, 22.83203125, 23.8330078125, 24.833984375, 25.8349609375, 26.8359375, 27.8369140625, 28.837890625, 29.8388671875, 30.83984375, 31.8408203125, 32.841796875, 33.8427734375, 34.84375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 25.0, 19.0, 32.0, 57.0, 95.0, 210.0, 316.0, 574.0, 1305.0, 2773.0, 6464.0, 16030.0, 41918.0, 186585.0, 677007.0, 71098.0, 26023.0, 10079.0, 4164.0, 1852.0, 881.0, 457.0, 236.0, 149.0, 60.0, 48.0, 36.0, 18.0, 17.0, 4.0, 7.0, 5.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.54248046875, -12.9599609375, -12.37744140625, -11.794921875, -11.21240234375, -10.6298828125, -10.04736328125, -9.46484375, -8.88232421875, -8.2998046875, -7.71728515625, -7.134765625, -6.55224609375, -5.9697265625, -5.38720703125, -4.8046875, -4.22216796875, -3.6396484375, -3.05712890625, -2.474609375, -1.89208984375, -1.3095703125, -0.72705078125, -0.14453125, 0.43798828125, 1.0205078125, 1.60302734375, 2.185546875, 2.76806640625, 3.3505859375, 3.93310546875, 4.515625, 5.09814453125, 5.6806640625, 6.26318359375, 6.845703125, 7.42822265625, 8.0107421875, 8.59326171875, 9.17578125, 9.75830078125, 10.3408203125, 10.92333984375, 11.505859375, 12.08837890625, 12.6708984375, 13.25341796875, 13.8359375, 14.41845703125, 15.0009765625, 15.58349609375, 16.166015625, 16.74853515625, 17.3310546875, 17.91357421875, 18.49609375, 19.07861328125, 19.6611328125, 20.24365234375, 20.826171875, 21.40869140625, 21.9912109375, 22.57373046875, 23.15625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 6.0, 8.0, 8.0, 5.0, 14.0, 3.0, 9.0, 12.0, 26.0, 25.0, 46.0, 172.0, 323.0, 158.0, 58.0, 19.0, 17.0, 17.0, 8.0, 8.0, 6.0, 2.0, 10.0, 11.0, 2.0, 8.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00447845458984375, -0.0043315887451171875, -0.004184722900390625, -0.0040378570556640625, -0.0038909912109375, -0.0037441253662109375, -0.003597259521484375, -0.0034503936767578125, -0.00330352783203125, -0.0031566619873046875, -0.003009796142578125, -0.0028629302978515625, -0.002716064453125, -0.0025691986083984375, -0.002422332763671875, -0.0022754669189453125, -0.00212860107421875, -0.0019817352294921875, -0.001834869384765625, -0.0016880035400390625, -0.0015411376953125, -0.0013942718505859375, -0.001247406005859375, -0.0011005401611328125, -0.00095367431640625, -0.0008068084716796875, -0.000659942626953125, -0.0005130767822265625, -0.0003662109375, -0.0002193450927734375, -7.2479248046875e-05, 7.43865966796875e-05, 0.00022125244140625, 0.0003681182861328125, 0.000514984130859375, 0.0006618499755859375, 0.0008087158203125, 0.0009555816650390625, 0.001102447509765625, 0.0012493133544921875, 0.00139617919921875, 0.0015430450439453125, 0.001689910888671875, 0.0018367767333984375, 0.001983642578125, 0.0021305084228515625, 0.002277374267578125, 0.0024242401123046875, 0.00257110595703125, 0.0027179718017578125, 0.002864837646484375, 0.0030117034912109375, 0.0031585693359375, 0.0033054351806640625, 0.003452301025390625, 0.0035991668701171875, 0.00374603271484375, 0.0038928985595703125, 0.004039764404296875, 0.0041866302490234375, 0.00433349609375, 0.0044803619384765625, 0.004627227783203125, 0.0047740936279296875, 0.00492095947265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 8.0, 14.0, 20.0, 27.0, 54.0, 85.0, 105.0, 196.0, 312.0, 526.0, 874.0, 1807.0, 4136.0, 10179.0, 26482.0, 73320.0, 656074.0, 202187.0, 43281.0, 16659.0, 6521.0, 2721.0, 1268.0, 648.0, 396.0, 211.0, 145.0, 91.0, 59.0, 35.0, 28.0, 20.0, 16.0, 8.0, 5.0, 9.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-18.703125, -18.1650390625, -17.626953125, -17.0888671875, -16.55078125, -16.0126953125, -15.474609375, -14.9365234375, -14.3984375, -13.8603515625, -13.322265625, -12.7841796875, -12.24609375, -11.7080078125, -11.169921875, -10.6318359375, -10.09375, -9.5556640625, -9.017578125, -8.4794921875, -7.94140625, -7.4033203125, -6.865234375, -6.3271484375, -5.7890625, -5.2509765625, -4.712890625, -4.1748046875, -3.63671875, -3.0986328125, -2.560546875, -2.0224609375, -1.484375, -0.9462890625, -0.408203125, 0.1298828125, 0.66796875, 1.2060546875, 1.744140625, 2.2822265625, 2.8203125, 3.3583984375, 3.896484375, 4.4345703125, 4.97265625, 5.5107421875, 6.048828125, 6.5869140625, 7.125, 7.6630859375, 8.201171875, 8.7392578125, 9.27734375, 9.8154296875, 10.353515625, 10.8916015625, 11.4296875, 11.9677734375, 12.505859375, 13.0439453125, 13.58203125, 14.1201171875, 14.658203125, 15.1962890625, 15.734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 5.0, 16.0, 15.0, 9.0, 13.0, 23.0, 21.0, 32.0, 64.0, 108.0, 173.0, 151.0, 113.0, 59.0, 33.0, 21.0, 16.0, 14.0, 13.0, 7.0, 2.0, 7.0, 9.0, 4.0, 4.0, 4.0, 5.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.59375, -10.201416015625, -9.80908203125, -9.416748046875, -9.0244140625, -8.632080078125, -8.23974609375, -7.847412109375, -7.455078125, -7.062744140625, -6.67041015625, -6.278076171875, -5.8857421875, -5.493408203125, -5.10107421875, -4.708740234375, -4.31640625, -3.924072265625, -3.53173828125, -3.139404296875, -2.7470703125, -2.354736328125, -1.96240234375, -1.570068359375, -1.177734375, -0.785400390625, -0.39306640625, -0.000732421875, 0.3916015625, 0.783935546875, 1.17626953125, 1.568603515625, 1.9609375, 2.353271484375, 2.74560546875, 3.137939453125, 3.5302734375, 3.922607421875, 4.31494140625, 4.707275390625, 5.099609375, 5.491943359375, 5.88427734375, 6.276611328125, 6.6689453125, 7.061279296875, 7.45361328125, 7.845947265625, 8.23828125, 8.630615234375, 9.02294921875, 9.415283203125, 9.8076171875, 10.199951171875, 10.59228515625, 10.984619140625, 11.376953125, 11.769287109375, 12.16162109375, 12.553955078125, 12.9462890625, 13.338623046875, 13.73095703125, 14.123291015625, 14.515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 16.0, 15.0, 23.0, 54.0, 45.0, 83.0, 114.0, 126.0, 134.0, 110.0, 79.0, 67.0, 46.0, 38.0, 21.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-237.42584228515625, -230.86273193359375, -224.2996368408203, -217.73654174804688, -211.17343139648438, -204.61032104492188, -198.04722595214844, -191.484130859375, -184.9210205078125, -178.35791015625, -171.79481506347656, -165.23171997070312, -158.66860961914062, -152.10549926757812, -145.5424041748047, -138.97930908203125, -132.41619873046875, -125.85309600830078, -119.28999328613281, -112.72689056396484, -106.16378784179688, -99.6006851196289, -93.03758239746094, -86.47447967529297, -79.911376953125, -73.34827423095703, -66.78517150878906, -60.222068786621094, -53.658966064453125, -47.095863342285156, -40.53276062011719, -33.96965789794922, -27.40655517578125, -20.84345245361328, -14.280349731445312, -7.717247009277344, -1.154144287109375, 5.408958435058594, 11.972061157226562, 18.53516387939453, 25.0982666015625, 31.66136932373047, 38.22447204589844, 44.787574768066406, 51.350677490234375, 57.913780212402344, 64.47688293457031, 71.03998565673828, 77.60308837890625, 84.16619110107422, 90.72929382324219, 97.29239654541016, 103.85549926757812, 110.4186019897461, 116.98170471191406, 123.54480743408203, 130.10791015625, 136.6710205078125, 143.23411560058594, 149.79721069335938, 156.36032104492188, 162.92343139648438, 169.4865264892578, 176.04962158203125, 182.61273193359375]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 4.0, 8.0, 17.0, 16.0, 18.0, 23.0, 22.0, 20.0, 33.0, 33.0, 27.0, 36.0, 44.0, 52.0, 47.0, 51.0, 40.0, 36.0, 46.0, 36.0, 44.0, 40.0, 38.0, 28.0, 36.0, 25.0, 38.0, 17.0, 13.0, 22.0, 20.0, 13.0, 9.0, 10.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.8253173828125, -97.4686279296875, -94.1119384765625, -90.7552490234375, -87.3985595703125, -84.0418701171875, -80.6851806640625, -77.3284912109375, -73.9718017578125, -70.6151123046875, -67.2584228515625, -63.9017333984375, -60.5450439453125, -57.1883544921875, -53.8316650390625, -50.4749755859375, -47.118282318115234, -43.761592864990234, -40.404903411865234, -37.048213958740234, -33.691524505615234, -30.3348331451416, -26.9781436920166, -23.6214542388916, -20.2647647857666, -16.9080753326416, -13.551385879516602, -10.194695472717285, -6.838006019592285, -3.4813156127929688, -0.12462615966796875, 3.2320632934570312, 6.588752746582031, 9.945442199707031, 13.302131652832031, 16.65882110595703, 20.01551055908203, 23.372201919555664, 26.728891372680664, 30.085580825805664, 33.44226837158203, 36.79895782470703, 40.15564727783203, 43.51233673095703, 46.86902618408203, 50.22571563720703, 53.58240509033203, 56.93909454345703, 60.2957878112793, 63.6524772644043, 67.00917053222656, 70.36585998535156, 73.72254943847656, 77.07923889160156, 80.43592834472656, 83.79261779785156, 87.14930725097656, 90.50599670410156, 93.86268615722656, 97.21937561035156, 100.57606506347656, 103.93275451660156, 107.28944396972656, 110.64613342285156, 114.00282287597656]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 13.0, 22.0, 23.0, 39.0, 56.0, 93.0, 180.0, 313.0, 572.0, 1117.0, 2288.0, 4911.0, 10559.0, 25244.0, 68824.0, 288015.0, 3319646.0, 345903.0, 77073.0, 27521.0, 11509.0, 5141.0, 2485.0, 1242.0, 640.0, 319.0, 185.0, 109.0, 91.0, 35.0, 30.0, 26.0, 12.0, 12.0, 5.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.713623046875, -31.70849609375, -30.703369140625, -29.6982421875, -28.693115234375, -27.68798828125, -26.682861328125, -25.677734375, -24.672607421875, -23.66748046875, -22.662353515625, -21.6572265625, -20.652099609375, -19.64697265625, -18.641845703125, -17.63671875, -16.631591796875, -15.62646484375, -14.621337890625, -13.6162109375, -12.611083984375, -11.60595703125, -10.600830078125, -9.595703125, -8.590576171875, -7.58544921875, -6.580322265625, -5.5751953125, -4.570068359375, -3.56494140625, -2.559814453125, -1.5546875, -0.549560546875, 0.45556640625, 1.460693359375, 2.4658203125, 3.470947265625, 4.47607421875, 5.481201171875, 6.486328125, 7.491455078125, 8.49658203125, 9.501708984375, 10.5068359375, 11.511962890625, 12.51708984375, 13.522216796875, 14.52734375, 15.532470703125, 16.53759765625, 17.542724609375, 18.5478515625, 19.552978515625, 20.55810546875, 21.563232421875, 22.568359375, 23.573486328125, 24.57861328125, 25.583740234375, 26.5888671875, 27.593994140625, 28.59912109375, 29.604248046875, 30.609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 4.0, 12.0, 13.0, 16.0, 19.0, 16.0, 19.0, 28.0, 31.0, 34.0, 30.0, 35.0, 41.0, 42.0, 45.0, 48.0, 53.0, 41.0, 58.0, 45.0, 49.0, 46.0, 46.0, 43.0, 28.0, 22.0, 23.0, 23.0, 14.0, 11.0, 15.0, 9.0, 6.0, 8.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.684814453125, -4.52197265625, -4.359130859375, -4.1962890625, -4.033447265625, -3.87060546875, -3.707763671875, -3.544921875, -3.382080078125, -3.21923828125, -3.056396484375, -2.8935546875, -2.730712890625, -2.56787109375, -2.405029296875, -2.2421875, -2.079345703125, -1.91650390625, -1.753662109375, -1.5908203125, -1.427978515625, -1.26513671875, -1.102294921875, -0.939453125, -0.776611328125, -0.61376953125, -0.450927734375, -0.2880859375, -0.125244140625, 0.03759765625, 0.200439453125, 0.36328125, 0.526123046875, 0.68896484375, 0.851806640625, 1.0146484375, 1.177490234375, 1.34033203125, 1.503173828125, 1.666015625, 1.828857421875, 1.99169921875, 2.154541015625, 2.3173828125, 2.480224609375, 2.64306640625, 2.805908203125, 2.96875, 3.131591796875, 3.29443359375, 3.457275390625, 3.6201171875, 3.782958984375, 3.94580078125, 4.108642578125, 4.271484375, 4.434326171875, 4.59716796875, 4.760009765625, 4.9228515625, 5.085693359375, 5.24853515625, 5.411376953125, 5.57421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 8.0, 16.0, 22.0, 32.0, 41.0, 59.0, 105.0, 170.0, 253.0, 382.0, 557.0, 824.0, 1361.0, 2158.0, 3878.0, 7259.0, 15879.0, 39632.0, 123335.0, 734130.0, 2928231.0, 228575.0, 62120.0, 22691.0, 10169.0, 5129.0, 2859.0, 1621.0, 971.0, 595.0, 400.0, 262.0, 183.0, 104.0, 82.0, 77.0, 22.0, 20.0, 20.0, 9.0, 18.0, 7.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.5, -34.39794921875, -33.2958984375, -32.19384765625, -31.091796875, -29.98974609375, -28.8876953125, -27.78564453125, -26.68359375, -25.58154296875, -24.4794921875, -23.37744140625, -22.275390625, -21.17333984375, -20.0712890625, -18.96923828125, -17.8671875, -16.76513671875, -15.6630859375, -14.56103515625, -13.458984375, -12.35693359375, -11.2548828125, -10.15283203125, -9.05078125, -7.94873046875, -6.8466796875, -5.74462890625, -4.642578125, -3.54052734375, -2.4384765625, -1.33642578125, -0.234375, 0.86767578125, 1.9697265625, 3.07177734375, 4.173828125, 5.27587890625, 6.3779296875, 7.47998046875, 8.58203125, 9.68408203125, 10.7861328125, 11.88818359375, 12.990234375, 14.09228515625, 15.1943359375, 16.29638671875, 17.3984375, 18.50048828125, 19.6025390625, 20.70458984375, 21.806640625, 22.90869140625, 24.0107421875, 25.11279296875, 26.21484375, 27.31689453125, 28.4189453125, 29.52099609375, 30.623046875, 31.72509765625, 32.8271484375, 33.92919921875, 35.03125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 3.0, 4.0, 4.0, 11.0, 12.0, 21.0, 23.0, 36.0, 74.0, 85.0, 176.0, 324.0, 1054.0, 1366.0, 355.0, 183.0, 107.0, 61.0, 46.0, 33.0, 30.0, 14.0, 12.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.046875, -17.4462890625, -16.845703125, -16.2451171875, -15.64453125, -15.0439453125, -14.443359375, -13.8427734375, -13.2421875, -12.6416015625, -12.041015625, -11.4404296875, -10.83984375, -10.2392578125, -9.638671875, -9.0380859375, -8.4375, -7.8369140625, -7.236328125, -6.6357421875, -6.03515625, -5.4345703125, -4.833984375, -4.2333984375, -3.6328125, -3.0322265625, -2.431640625, -1.8310546875, -1.23046875, -0.6298828125, -0.029296875, 0.5712890625, 1.171875, 1.7724609375, 2.373046875, 2.9736328125, 3.57421875, 4.1748046875, 4.775390625, 5.3759765625, 5.9765625, 6.5771484375, 7.177734375, 7.7783203125, 8.37890625, 8.9794921875, 9.580078125, 10.1806640625, 10.78125, 11.3818359375, 11.982421875, 12.5830078125, 13.18359375, 13.7841796875, 14.384765625, 14.9853515625, 15.5859375, 16.1865234375, 16.787109375, 17.3876953125, 17.98828125, 18.5888671875, 19.189453125, 19.7900390625, 20.390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 10.0, 10.0, 23.0, 37.0, 62.0, 77.0, 113.0, 113.0, 141.0, 131.0, 79.0, 73.0, 39.0, 40.0, 25.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.73176574707031, -97.88178253173828, -94.03179931640625, -90.18182373046875, -86.33184051513672, -82.48185729980469, -78.63187408447266, -74.78189086914062, -70.9319076538086, -67.08192443847656, -63.2319450378418, -59.381961822509766, -55.531978607177734, -51.68199920654297, -47.83201599121094, -43.982032775878906, -40.13205337524414, -36.28207015991211, -32.432090759277344, -28.582107543945312, -24.73212432861328, -20.882143020629883, -17.032161712646484, -13.182178497314453, -9.332197189331055, -5.48221492767334, -1.6322331428527832, 2.2177486419677734, 6.067730903625488, 9.917713165283203, 13.767694473266602, 17.617677688598633, 21.46765899658203, 25.31764030456543, 29.16762351989746, 33.01760482788086, 36.86758804321289, 40.717567443847656, 44.56755065917969, 48.41753387451172, 52.26751708984375, 56.11750030517578, 59.96747970581055, 63.81746292114258, 67.66744232177734, 71.51742553710938, 75.3674087524414, 79.21739196777344, 83.06736755371094, 86.91735076904297, 90.767333984375, 94.6173095703125, 98.46729278564453, 102.31727600097656, 106.1672592163086, 110.01724243164062, 113.86722564697266, 117.71720886230469, 121.56719207763672, 125.41717529296875, 129.26715087890625, 133.1171417236328, 136.9671173095703, 140.81710815429688, 144.66708374023438]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 11.0, 18.0, 8.0, 14.0, 11.0, 21.0, 22.0, 19.0, 28.0, 33.0, 25.0, 33.0, 30.0, 30.0, 48.0, 31.0, 46.0, 50.0, 51.0, 43.0, 52.0, 41.0, 30.0, 32.0, 41.0, 16.0, 20.0, 27.0, 20.0, 13.0, 17.0, 18.0, 11.0, 12.0, 11.0, 6.0, 7.0, 5.0, 6.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-58.35264587402344, -56.58753967285156, -54.82243347167969, -53.05732345581055, -51.29221725463867, -49.5271110534668, -47.762001037597656, -45.99689483642578, -44.231788635253906, -42.46668243408203, -40.701576232910156, -38.936466217041016, -37.17136001586914, -35.406253814697266, -33.641143798828125, -31.87603759765625, -30.110931396484375, -28.3458251953125, -26.580717086791992, -24.815608978271484, -23.05050277709961, -21.285396575927734, -19.520288467407227, -17.75518035888672, -15.990074157714844, -14.224967002868652, -12.459859848022461, -10.69475269317627, -8.929645538330078, -7.164538383483887, -5.399431228637695, -3.634324073791504, -1.8692207336425781, -0.10411357879638672, 1.6609935760498047, 3.426100730895996, 5.1912078857421875, 6.956315040588379, 8.72142219543457, 10.486529350280762, 12.251636505126953, 14.016743659973145, 15.781850814819336, 17.546958923339844, 19.31206512451172, 21.077171325683594, 22.8422794342041, 24.60738754272461, 26.372493743896484, 28.13759994506836, 29.902708053588867, 31.667816162109375, 33.43292236328125, 35.198028564453125, 36.963134765625, 38.72824478149414, 40.493350982666016, 42.25845718383789, 44.02356719970703, 45.788673400878906, 47.55377960205078, 49.318885803222656, 51.08399200439453, 52.84910202026367, 54.61420822143555]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 8.0, 6.0, 5.0, 4.0, 15.0, 24.0, 23.0, 46.0, 60.0, 80.0, 129.0, 205.0, 324.0, 585.0, 1062.0, 1936.0, 3647.0, 7060.0, 13862.0, 26994.0, 52017.0, 99729.0, 212283.0, 308912.0, 157234.0, 77844.0, 40711.0, 21054.0, 10743.0, 5379.0, 2877.0, 1579.0, 849.0, 471.0, 285.0, 159.0, 101.0, 79.0, 45.0, 36.0, 19.0, 14.0, 19.0, 12.0, 9.0, 7.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.03125, -19.429931640625, -18.82861328125, -18.227294921875, -17.6259765625, -17.024658203125, -16.42333984375, -15.822021484375, -15.220703125, -14.619384765625, -14.01806640625, -13.416748046875, -12.8154296875, -12.214111328125, -11.61279296875, -11.011474609375, -10.41015625, -9.808837890625, -9.20751953125, -8.606201171875, -8.0048828125, -7.403564453125, -6.80224609375, -6.200927734375, -5.599609375, -4.998291015625, -4.39697265625, -3.795654296875, -3.1943359375, -2.593017578125, -1.99169921875, -1.390380859375, -0.7890625, -0.187744140625, 0.41357421875, 1.014892578125, 1.6162109375, 2.217529296875, 2.81884765625, 3.420166015625, 4.021484375, 4.622802734375, 5.22412109375, 5.825439453125, 6.4267578125, 7.028076171875, 7.62939453125, 8.230712890625, 8.83203125, 9.433349609375, 10.03466796875, 10.635986328125, 11.2373046875, 11.838623046875, 12.43994140625, 13.041259765625, 13.642578125, 14.243896484375, 14.84521484375, 15.446533203125, 16.0478515625, 16.649169921875, 17.25048828125, 17.851806640625, 18.453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 7.0, 5.0, 11.0, 22.0, 11.0, 17.0, 28.0, 19.0, 29.0, 31.0, 24.0, 34.0, 35.0, 56.0, 49.0, 43.0, 59.0, 47.0, 43.0, 45.0, 61.0, 38.0, 41.0, 40.0, 32.0, 27.0, 23.0, 28.0, 19.0, 18.0, 14.0, 17.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.40606689453125, -5.1910400390625, -4.97601318359375, -4.760986328125, -4.54595947265625, -4.3309326171875, -4.11590576171875, -3.90087890625, -3.68585205078125, -3.4708251953125, -3.25579833984375, -3.040771484375, -2.82574462890625, -2.6107177734375, -2.39569091796875, -2.1806640625, -1.96563720703125, -1.7506103515625, -1.53558349609375, -1.320556640625, -1.10552978515625, -0.8905029296875, -0.67547607421875, -0.46044921875, -0.24542236328125, -0.0303955078125, 0.18463134765625, 0.399658203125, 0.61468505859375, 0.8297119140625, 1.04473876953125, 1.259765625, 1.47479248046875, 1.6898193359375, 1.90484619140625, 2.119873046875, 2.33489990234375, 2.5499267578125, 2.76495361328125, 2.97998046875, 3.19500732421875, 3.4100341796875, 3.62506103515625, 3.840087890625, 4.05511474609375, 4.2701416015625, 4.48516845703125, 4.7001953125, 4.91522216796875, 5.1302490234375, 5.34527587890625, 5.560302734375, 5.77532958984375, 5.9903564453125, 6.20538330078125, 6.42041015625, 6.63543701171875, 6.8504638671875, 7.06549072265625, 7.280517578125, 7.49554443359375, 7.7105712890625, 7.92559814453125, 8.140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 3.0, 10.0, 6.0, 14.0, 16.0, 29.0, 27.0, 32.0, 77.0, 85.0, 120.0, 181.0, 288.0, 499.0, 1016.0, 2216.0, 6702.0, 29668.0, 153558.0, 666412.0, 147907.0, 28644.0, 6472.0, 2170.0, 944.0, 529.0, 299.0, 221.0, 114.0, 97.0, 63.0, 40.0, 29.0, 18.0, 17.0, 11.0, 8.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-45.28125, -43.84326171875, -42.4052734375, -40.96728515625, -39.529296875, -38.09130859375, -36.6533203125, -35.21533203125, -33.77734375, -32.33935546875, -30.9013671875, -29.46337890625, -28.025390625, -26.58740234375, -25.1494140625, -23.71142578125, -22.2734375, -20.83544921875, -19.3974609375, -17.95947265625, -16.521484375, -15.08349609375, -13.6455078125, -12.20751953125, -10.76953125, -9.33154296875, -7.8935546875, -6.45556640625, -5.017578125, -3.57958984375, -2.1416015625, -0.70361328125, 0.734375, 2.17236328125, 3.6103515625, 5.04833984375, 6.486328125, 7.92431640625, 9.3623046875, 10.80029296875, 12.23828125, 13.67626953125, 15.1142578125, 16.55224609375, 17.990234375, 19.42822265625, 20.8662109375, 22.30419921875, 23.7421875, 25.18017578125, 26.6181640625, 28.05615234375, 29.494140625, 30.93212890625, 32.3701171875, 33.80810546875, 35.24609375, 36.68408203125, 38.1220703125, 39.56005859375, 40.998046875, 42.43603515625, 43.8740234375, 45.31201171875, 46.75]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 6.0, 9.0, 6.0, 13.0, 9.0, 8.0, 20.0, 20.0, 15.0, 24.0, 26.0, 25.0, 43.0, 41.0, 30.0, 44.0, 41.0, 49.0, 53.0, 54.0, 49.0, 42.0, 54.0, 41.0, 25.0, 47.0, 18.0, 26.0, 16.0, 20.0, 22.0, 17.0, 8.0, 15.0, 10.0, 10.0, 4.0, 3.0, 7.0, 3.0, 4.0, 6.0, 8.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-34.0625, -33.035888671875, -32.00927734375, -30.982666015625, -29.9560546875, -28.929443359375, -27.90283203125, -26.876220703125, -25.849609375, -24.822998046875, -23.79638671875, -22.769775390625, -21.7431640625, -20.716552734375, -19.68994140625, -18.663330078125, -17.63671875, -16.610107421875, -15.58349609375, -14.556884765625, -13.5302734375, -12.503662109375, -11.47705078125, -10.450439453125, -9.423828125, -8.397216796875, -7.37060546875, -6.343994140625, -5.3173828125, -4.290771484375, -3.26416015625, -2.237548828125, -1.2109375, -0.184326171875, 0.84228515625, 1.868896484375, 2.8955078125, 3.922119140625, 4.94873046875, 5.975341796875, 7.001953125, 8.028564453125, 9.05517578125, 10.081787109375, 11.1083984375, 12.135009765625, 13.16162109375, 14.188232421875, 15.21484375, 16.241455078125, 17.26806640625, 18.294677734375, 19.3212890625, 20.347900390625, 21.37451171875, 22.401123046875, 23.427734375, 24.454345703125, 25.48095703125, 26.507568359375, 27.5341796875, 28.560791015625, 29.58740234375, 30.614013671875, 31.640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 7.0, 5.0, 10.0, 8.0, 10.0, 20.0, 49.0, 76.0, 142.0, 287.0, 679.0, 1635.0, 4485.0, 15226.0, 70702.0, 416399.0, 441991.0, 73538.0, 15622.0, 4570.0, 1723.0, 687.0, 334.0, 149.0, 72.0, 42.0, 27.0, 15.0, 9.0, 8.0, 8.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.608154296875, -20.88818359375, -20.168212890625, -19.4482421875, -18.728271484375, -18.00830078125, -17.288330078125, -16.568359375, -15.848388671875, -15.12841796875, -14.408447265625, -13.6884765625, -12.968505859375, -12.24853515625, -11.528564453125, -10.80859375, -10.088623046875, -9.36865234375, -8.648681640625, -7.9287109375, -7.208740234375, -6.48876953125, -5.768798828125, -5.048828125, -4.328857421875, -3.60888671875, -2.888916015625, -2.1689453125, -1.448974609375, -0.72900390625, -0.009033203125, 0.7109375, 1.430908203125, 2.15087890625, 2.870849609375, 3.5908203125, 4.310791015625, 5.03076171875, 5.750732421875, 6.470703125, 7.190673828125, 7.91064453125, 8.630615234375, 9.3505859375, 10.070556640625, 10.79052734375, 11.510498046875, 12.23046875, 12.950439453125, 13.67041015625, 14.390380859375, 15.1103515625, 15.830322265625, 16.55029296875, 17.270263671875, 17.990234375, 18.710205078125, 19.43017578125, 20.150146484375, 20.8701171875, 21.590087890625, 22.31005859375, 23.030029296875, 23.75]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 3.0, 10.0, 10.0, 16.0, 12.0, 11.0, 27.0, 31.0, 44.0, 45.0, 81.0, 160.0, 169.0, 86.0, 60.0, 41.0, 33.0, 31.0, 21.0, 28.0, 15.0, 5.0, 7.0, 10.0, 5.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.005039215087890625, -0.004900127649307251, -0.004761040210723877, -0.004621952772140503, -0.004482865333557129, -0.004343777894973755, -0.004204690456390381, -0.004065603017807007, -0.003926515579223633, -0.003787428140640259, -0.0036483407020568848, -0.0035092532634735107, -0.0033701658248901367, -0.0032310783863067627, -0.0030919909477233887, -0.0029529035091400146, -0.0028138160705566406, -0.0026747286319732666, -0.0025356411933898926, -0.0023965537548065186, -0.0022574663162231445, -0.0021183788776397705, -0.0019792914390563965, -0.0018402040004730225, -0.0017011165618896484, -0.0015620291233062744, -0.0014229416847229004, -0.0012838542461395264, -0.0011447668075561523, -0.0010056793689727783, -0.0008665919303894043, -0.0007275044918060303, -0.0005884170532226562, -0.0004493296146392822, -0.0003102421760559082, -0.00017115473747253418, -3.2067298889160156e-05, 0.00010702013969421387, 0.0002461075782775879, 0.0003851950168609619, 0.0005242824554443359, 0.00066336989402771, 0.000802457332611084, 0.000941544771194458, 0.001080632209777832, 0.001219719648361206, 0.00135880708694458, 0.001497894525527954, 0.0016369819641113281, 0.0017760694026947021, 0.0019151568412780762, 0.00205424427986145, 0.0021933317184448242, 0.0023324191570281982, 0.0024715065956115723, 0.0026105940341949463, 0.0027496814727783203, 0.0028887689113616943, 0.0030278563499450684, 0.0031669437885284424, 0.0033060312271118164, 0.0034451186656951904, 0.0035842061042785645, 0.0037232935428619385, 0.0038623809814453125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 4.0, 7.0, 6.0, 7.0, 14.0, 25.0, 35.0, 70.0, 120.0, 187.0, 355.0, 670.0, 1642.0, 4303.0, 15361.0, 80878.0, 523244.0, 351322.0, 53262.0, 11127.0, 3259.0, 1322.0, 597.0, 293.0, 182.0, 78.0, 59.0, 32.0, 23.0, 15.0, 11.0, 11.0, 7.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.28125, -24.462646484375, -23.64404296875, -22.825439453125, -22.0068359375, -21.188232421875, -20.36962890625, -19.551025390625, -18.732421875, -17.913818359375, -17.09521484375, -16.276611328125, -15.4580078125, -14.639404296875, -13.82080078125, -13.002197265625, -12.18359375, -11.364990234375, -10.54638671875, -9.727783203125, -8.9091796875, -8.090576171875, -7.27197265625, -6.453369140625, -5.634765625, -4.816162109375, -3.99755859375, -3.178955078125, -2.3603515625, -1.541748046875, -0.72314453125, 0.095458984375, 0.9140625, 1.732666015625, 2.55126953125, 3.369873046875, 4.1884765625, 5.007080078125, 5.82568359375, 6.644287109375, 7.462890625, 8.281494140625, 9.10009765625, 9.918701171875, 10.7373046875, 11.555908203125, 12.37451171875, 13.193115234375, 14.01171875, 14.830322265625, 15.64892578125, 16.467529296875, 17.2861328125, 18.104736328125, 18.92333984375, 19.741943359375, 20.560546875, 21.379150390625, 22.19775390625, 23.016357421875, 23.8349609375, 24.653564453125, 25.47216796875, 26.290771484375, 27.109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 3.0, 6.0, 8.0, 12.0, 13.0, 15.0, 19.0, 30.0, 33.0, 29.0, 48.0, 64.0, 77.0, 89.0, 96.0, 95.0, 73.0, 49.0, 60.0, 26.0, 31.0, 29.0, 17.0, 20.0, 12.0, 10.0, 5.0, 5.0, 3.0, 3.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.400146484375, -15.86279296875, -15.325439453125, -14.7880859375, -14.250732421875, -13.71337890625, -13.176025390625, -12.638671875, -12.101318359375, -11.56396484375, -11.026611328125, -10.4892578125, -9.951904296875, -9.41455078125, -8.877197265625, -8.33984375, -7.802490234375, -7.26513671875, -6.727783203125, -6.1904296875, -5.653076171875, -5.11572265625, -4.578369140625, -4.041015625, -3.503662109375, -2.96630859375, -2.428955078125, -1.8916015625, -1.354248046875, -0.81689453125, -0.279541015625, 0.2578125, 0.795166015625, 1.33251953125, 1.869873046875, 2.4072265625, 2.944580078125, 3.48193359375, 4.019287109375, 4.556640625, 5.093994140625, 5.63134765625, 6.168701171875, 6.7060546875, 7.243408203125, 7.78076171875, 8.318115234375, 8.85546875, 9.392822265625, 9.93017578125, 10.467529296875, 11.0048828125, 11.542236328125, 12.07958984375, 12.616943359375, 13.154296875, 13.691650390625, 14.22900390625, 14.766357421875, 15.3037109375, 15.841064453125, 16.37841796875, 16.915771484375, 17.453125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 11.0, 16.0, 15.0, 25.0, 63.0, 101.0, 110.0, 130.0, 120.0, 113.0, 99.0, 82.0, 51.0, 22.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-358.5999755859375, -349.4037170410156, -340.2074890136719, -331.01123046875, -321.81500244140625, -312.6187438964844, -303.4224853515625, -294.22625732421875, -285.0299987792969, -275.833740234375, -266.63751220703125, -257.4412536621094, -248.24501037597656, -239.04876708984375, -229.85250854492188, -220.65626525878906, -211.46002197265625, -202.26377868652344, -193.06753540039062, -183.87127685546875, -174.67503356933594, -165.47879028320312, -156.28253173828125, -147.08628845214844, -137.89004516601562, -128.6938018798828, -119.49755096435547, -110.30130004882812, -101.10505676269531, -91.9088134765625, -82.71256256103516, -73.51631164550781, -64.32005310058594, -55.12380599975586, -45.92755889892578, -36.7313117980957, -27.535064697265625, -18.338817596435547, -9.142570495605469, 0.053680419921875, 9.249923706054688, 18.446170806884766, 27.642417907714844, 36.83866500854492, 46.034912109375, 55.23115921020508, 64.42740631103516, 73.6236572265625, 82.81990051269531, 92.01614379882812, 101.21239471435547, 110.40864562988281, 119.60488891601562, 128.80113220214844, 137.99737548828125, 147.19363403320312, 156.38987731933594, 165.58612060546875, 174.78237915039062, 183.97862243652344, 193.17486572265625, 202.37110900878906, 211.56735229492188, 220.76361083984375, 229.95985412597656]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 12.0, 10.0, 8.0, 8.0, 13.0, 10.0, 17.0, 12.0, 20.0, 14.0, 27.0, 34.0, 20.0, 39.0, 29.0, 45.0, 47.0, 40.0, 41.0, 51.0, 33.0, 43.0, 40.0, 47.0, 34.0, 45.0, 35.0, 31.0, 27.0, 26.0, 15.0, 21.0, 18.0, 16.0, 16.0, 12.0, 7.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.96075439453125, -151.72427368164062, -146.48779296875, -141.25131225585938, -136.01483154296875, -130.77835083007812, -125.5418701171875, -120.30538940429688, -115.06890869140625, -109.83242797851562, -104.595947265625, -99.35946655273438, -94.12298583984375, -88.88650512695312, -83.6500244140625, -78.41354370117188, -73.17705535888672, -67.9405746459961, -62.70409393310547, -57.467613220214844, -52.23113250732422, -46.994651794433594, -41.7581672668457, -36.52168655395508, -31.285205841064453, -26.048725128173828, -20.812244415283203, -15.575761795043945, -10.33928108215332, -5.102800369262695, 0.1336822509765625, 5.3701629638671875, 10.606643676757812, 15.843124389648438, 21.079605102539062, 26.31608772277832, 31.552568435668945, 36.78904724121094, 42.02553176879883, 47.26201248168945, 52.49849319458008, 57.7349739074707, 62.97145462036133, 68.20793914794922, 73.44441986083984, 78.68090057373047, 83.9173812866211, 89.15386199951172, 94.39034271240234, 99.62682342529297, 104.8633041381836, 110.09978485107422, 115.33626556396484, 120.57274627685547, 125.80923461914062, 131.04571533203125, 136.28219604492188, 141.5186767578125, 146.75515747070312, 151.99163818359375, 157.22811889648438, 162.464599609375, 167.70108032226562, 172.93756103515625, 178.17404174804688]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 7.0, 17.0, 24.0, 38.0, 43.0, 73.0, 110.0, 140.0, 244.0, 357.0, 576.0, 868.0, 1383.0, 2236.0, 3462.0, 5888.0, 10770.0, 20655.0, 42684.0, 103015.0, 332606.0, 2792714.0, 609992.0, 149825.0, 57973.0, 26559.0, 13499.0, 7284.0, 4271.0, 2574.0, 1583.0, 944.0, 660.0, 417.0, 264.0, 180.0, 117.0, 83.0, 47.0, 31.0, 20.0, 12.0, 10.0, 6.0, 1.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-23.046875, -22.341552734375, -21.63623046875, -20.930908203125, -20.2255859375, -19.520263671875, -18.81494140625, -18.109619140625, -17.404296875, -16.698974609375, -15.99365234375, -15.288330078125, -14.5830078125, -13.877685546875, -13.17236328125, -12.467041015625, -11.76171875, -11.056396484375, -10.35107421875, -9.645751953125, -8.9404296875, -8.235107421875, -7.52978515625, -6.824462890625, -6.119140625, -5.413818359375, -4.70849609375, -4.003173828125, -3.2978515625, -2.592529296875, -1.88720703125, -1.181884765625, -0.4765625, 0.228759765625, 0.93408203125, 1.639404296875, 2.3447265625, 3.050048828125, 3.75537109375, 4.460693359375, 5.166015625, 5.871337890625, 6.57666015625, 7.281982421875, 7.9873046875, 8.692626953125, 9.39794921875, 10.103271484375, 10.80859375, 11.513916015625, 12.21923828125, 12.924560546875, 13.6298828125, 14.335205078125, 15.04052734375, 15.745849609375, 16.451171875, 17.156494140625, 17.86181640625, 18.567138671875, 19.2724609375, 19.977783203125, 20.68310546875, 21.388427734375, 22.09375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 9.0, 10.0, 8.0, 8.0, 11.0, 18.0, 15.0, 12.0, 18.0, 31.0, 22.0, 26.0, 29.0, 43.0, 48.0, 37.0, 41.0, 41.0, 47.0, 47.0, 37.0, 42.0, 42.0, 39.0, 55.0, 38.0, 31.0, 28.0, 24.0, 17.0, 18.0, 17.0, 12.0, 11.0, 8.0, 15.0, 8.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.18359375, -5.98406982421875, -5.7845458984375, -5.58502197265625, -5.385498046875, -5.18597412109375, -4.9864501953125, -4.78692626953125, -4.58740234375, -4.38787841796875, -4.1883544921875, -3.98883056640625, -3.789306640625, -3.58978271484375, -3.3902587890625, -3.19073486328125, -2.9912109375, -2.79168701171875, -2.5921630859375, -2.39263916015625, -2.193115234375, -1.99359130859375, -1.7940673828125, -1.59454345703125, -1.39501953125, -1.19549560546875, -0.9959716796875, -0.79644775390625, -0.596923828125, -0.39739990234375, -0.1978759765625, 0.00164794921875, 0.201171875, 0.40069580078125, 0.6002197265625, 0.79974365234375, 0.999267578125, 1.19879150390625, 1.3983154296875, 1.59783935546875, 1.79736328125, 1.99688720703125, 2.1964111328125, 2.39593505859375, 2.595458984375, 2.79498291015625, 2.9945068359375, 3.19403076171875, 3.3935546875, 3.59307861328125, 3.7926025390625, 3.99212646484375, 4.191650390625, 4.39117431640625, 4.5906982421875, 4.79022216796875, 4.98974609375, 5.18927001953125, 5.3887939453125, 5.58831787109375, 5.787841796875, 5.98736572265625, 6.1868896484375, 6.38641357421875, 6.5859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 8.0, 7.0, 14.0, 28.0, 22.0, 32.0, 52.0, 78.0, 118.0, 164.0, 303.0, 400.0, 677.0, 1279.0, 2683.0, 6104.0, 16319.0, 55536.0, 311242.0, 3352508.0, 356454.0, 60388.0, 17249.0, 6412.0, 2821.0, 1366.0, 731.0, 421.0, 304.0, 188.0, 123.0, 78.0, 66.0, 44.0, 17.0, 13.0, 8.0, 13.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.8408203125, -49.119140625, -47.3974609375, -45.67578125, -43.9541015625, -42.232421875, -40.5107421875, -38.7890625, -37.0673828125, -35.345703125, -33.6240234375, -31.90234375, -30.1806640625, -28.458984375, -26.7373046875, -25.015625, -23.2939453125, -21.572265625, -19.8505859375, -18.12890625, -16.4072265625, -14.685546875, -12.9638671875, -11.2421875, -9.5205078125, -7.798828125, -6.0771484375, -4.35546875, -2.6337890625, -0.912109375, 0.8095703125, 2.53125, 4.2529296875, 5.974609375, 7.6962890625, 9.41796875, 11.1396484375, 12.861328125, 14.5830078125, 16.3046875, 18.0263671875, 19.748046875, 21.4697265625, 23.19140625, 24.9130859375, 26.634765625, 28.3564453125, 30.078125, 31.7998046875, 33.521484375, 35.2431640625, 36.96484375, 38.6865234375, 40.408203125, 42.1298828125, 43.8515625, 45.5732421875, 47.294921875, 49.0166015625, 50.73828125, 52.4599609375, 54.181640625, 55.9033203125, 57.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 8.0, 4.0, 17.0, 8.0, 16.0, 24.0, 24.0, 42.0, 54.0, 79.0, 155.0, 281.0, 636.0, 1503.0, 542.0, 265.0, 142.0, 83.0, 59.0, 31.0, 29.0, 22.0, 12.0, 10.0, 8.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.171875, -29.366455078125, -28.56103515625, -27.755615234375, -26.9501953125, -26.144775390625, -25.33935546875, -24.533935546875, -23.728515625, -22.923095703125, -22.11767578125, -21.312255859375, -20.5068359375, -19.701416015625, -18.89599609375, -18.090576171875, -17.28515625, -16.479736328125, -15.67431640625, -14.868896484375, -14.0634765625, -13.258056640625, -12.45263671875, -11.647216796875, -10.841796875, -10.036376953125, -9.23095703125, -8.425537109375, -7.6201171875, -6.814697265625, -6.00927734375, -5.203857421875, -4.3984375, -3.593017578125, -2.78759765625, -1.982177734375, -1.1767578125, -0.371337890625, 0.43408203125, 1.239501953125, 2.044921875, 2.850341796875, 3.65576171875, 4.461181640625, 5.2666015625, 6.072021484375, 6.87744140625, 7.682861328125, 8.48828125, 9.293701171875, 10.09912109375, 10.904541015625, 11.7099609375, 12.515380859375, 13.32080078125, 14.126220703125, 14.931640625, 15.737060546875, 16.54248046875, 17.347900390625, 18.1533203125, 18.958740234375, 19.76416015625, 20.569580078125, 21.375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 7.0, 13.0, 13.0, 33.0, 45.0, 75.0, 107.0, 94.0, 109.0, 117.0, 94.0, 87.0, 65.0, 47.0, 33.0, 26.0, 11.0, 7.0, 6.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.55540466308594, -134.26116943359375, -128.96693420410156, -123.6727066040039, -118.37847900390625, -113.08424377441406, -107.79000854492188, -102.49578094482422, -97.20155334472656, -91.90731811523438, -86.61309051513672, -81.31885528564453, -76.02462768554688, -70.73039245605469, -65.4361572265625, -60.141929626464844, -54.847694396972656, -49.553462982177734, -44.25923156738281, -38.964996337890625, -33.67076873779297, -28.376535415649414, -23.08230209350586, -17.788070678710938, -12.493839263916016, -7.1996073722839355, -1.9053754806518555, 3.388856887817383, 8.683088302612305, 13.977319717407227, 19.27155303955078, 24.565784454345703, 29.860015869140625, 35.15424728393555, 40.44847869873047, 45.742713928222656, 51.03694152832031, 56.3311767578125, 61.62540817260742, 66.91963958740234, 72.2138671875, 77.50810241699219, 82.80233001708984, 88.09656524658203, 93.39079284667969, 98.68502807617188, 103.97926330566406, 109.27349090576172, 114.5677261352539, 119.8619613647461, 125.15618896484375, 130.45042419433594, 135.74465942382812, 141.03887939453125, 146.33311462402344, 151.62734985351562, 156.9215850830078, 162.2158203125, 167.5100555419922, 172.8042755126953, 178.0985107421875, 183.3927459716797, 188.68698120117188, 193.981201171875, 199.2754364013672]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 4.0, 9.0, 8.0, 13.0, 16.0, 11.0, 18.0, 20.0, 23.0, 37.0, 37.0, 41.0, 32.0, 29.0, 42.0, 45.0, 51.0, 40.0, 59.0, 52.0, 49.0, 44.0, 45.0, 25.0, 37.0, 26.0, 27.0, 22.0, 20.0, 16.0, 26.0, 18.0, 9.0, 10.0, 7.0, 7.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.6792221069336, -80.02071380615234, -77.3622055053711, -74.70369720458984, -72.0451889038086, -69.38668060302734, -66.7281723022461, -64.06967163085938, -61.41115951538086, -58.75265121459961, -56.09414291381836, -53.43563461303711, -50.777130126953125, -48.118621826171875, -45.460113525390625, -42.801605224609375, -40.143096923828125, -37.484588623046875, -34.826080322265625, -32.167572021484375, -29.509065628051758, -26.850557327270508, -24.19205093383789, -21.53354263305664, -18.87503433227539, -16.21652603149414, -13.558018684387207, -10.899511337280273, -8.241003036499023, -5.582494735717773, -2.92398738861084, -0.26548004150390625, 2.3930282592773438, 5.0515360832214355, 7.710043907165527, 10.368551254272461, 13.027059555053711, 15.685567855834961, 18.344074249267578, 21.002582550048828, 23.661090850830078, 26.319599151611328, 28.978107452392578, 31.636613845825195, 34.29512023925781, 36.95362854003906, 39.61213684082031, 42.27064514160156, 44.92915344238281, 47.58766174316406, 50.24617004394531, 52.90467834472656, 55.56318664550781, 58.22169494628906, 60.88019943237305, 63.5387077331543, 66.19721984863281, 68.85572814941406, 71.51423645019531, 74.17274475097656, 76.83125305175781, 79.48976135253906, 82.14826965332031, 84.80677795410156, 87.46527862548828]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 14.0, 17.0, 13.0, 39.0, 31.0, 72.0, 73.0, 134.0, 208.0, 263.0, 438.0, 763.0, 1208.0, 2179.0, 4013.0, 7395.0, 14004.0, 29473.0, 62589.0, 133566.0, 246375.0, 260315.0, 148172.0, 70217.0, 32852.0, 15825.0, 8033.0, 4352.0, 2284.0, 1345.0, 811.0, 529.0, 318.0, 200.0, 140.0, 90.0, 68.0, 38.0, 28.0, 20.0, 17.0, 2.0, 10.0, 3.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.4375, -19.80029296875, -19.1630859375, -18.52587890625, -17.888671875, -17.25146484375, -16.6142578125, -15.97705078125, -15.33984375, -14.70263671875, -14.0654296875, -13.42822265625, -12.791015625, -12.15380859375, -11.5166015625, -10.87939453125, -10.2421875, -9.60498046875, -8.9677734375, -8.33056640625, -7.693359375, -7.05615234375, -6.4189453125, -5.78173828125, -5.14453125, -4.50732421875, -3.8701171875, -3.23291015625, -2.595703125, -1.95849609375, -1.3212890625, -0.68408203125, -0.046875, 0.59033203125, 1.2275390625, 1.86474609375, 2.501953125, 3.13916015625, 3.7763671875, 4.41357421875, 5.05078125, 5.68798828125, 6.3251953125, 6.96240234375, 7.599609375, 8.23681640625, 8.8740234375, 9.51123046875, 10.1484375, 10.78564453125, 11.4228515625, 12.06005859375, 12.697265625, 13.33447265625, 13.9716796875, 14.60888671875, 15.24609375, 15.88330078125, 16.5205078125, 17.15771484375, 17.794921875, 18.43212890625, 19.0693359375, 19.70654296875, 20.34375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 9.0, 3.0, 5.0, 11.0, 14.0, 14.0, 20.0, 31.0, 31.0, 32.0, 36.0, 42.0, 34.0, 39.0, 45.0, 37.0, 56.0, 49.0, 51.0, 38.0, 47.0, 45.0, 47.0, 39.0, 37.0, 36.0, 17.0, 22.0, 19.0, 20.0, 14.0, 14.0, 8.0, 8.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.4609375, -9.1990966796875, -8.937255859375, -8.6754150390625, -8.41357421875, -8.1517333984375, -7.889892578125, -7.6280517578125, -7.3662109375, -7.1043701171875, -6.842529296875, -6.5806884765625, -6.31884765625, -6.0570068359375, -5.795166015625, -5.5333251953125, -5.271484375, -5.0096435546875, -4.747802734375, -4.4859619140625, -4.22412109375, -3.9622802734375, -3.700439453125, -3.4385986328125, -3.1767578125, -2.9149169921875, -2.653076171875, -2.3912353515625, -2.12939453125, -1.8675537109375, -1.605712890625, -1.3438720703125, -1.08203125, -0.8201904296875, -0.558349609375, -0.2965087890625, -0.03466796875, 0.2271728515625, 0.489013671875, 0.7508544921875, 1.0126953125, 1.2745361328125, 1.536376953125, 1.7982177734375, 2.06005859375, 2.3218994140625, 2.583740234375, 2.8455810546875, 3.107421875, 3.3692626953125, 3.631103515625, 3.8929443359375, 4.15478515625, 4.4166259765625, 4.678466796875, 4.9403076171875, 5.2021484375, 5.4639892578125, 5.725830078125, 5.9876708984375, 6.24951171875, 6.5113525390625, 6.773193359375, 7.0350341796875, 7.296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 14.0, 18.0, 22.0, 36.0, 46.0, 91.0, 118.0, 193.0, 295.0, 506.0, 965.0, 2415.0, 9078.0, 54429.0, 436372.0, 470176.0, 59100.0, 9756.0, 2530.0, 1023.0, 519.0, 274.0, 206.0, 114.0, 70.0, 52.0, 39.0, 32.0, 14.0, 8.0, 12.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.71875, -47.0400390625, -45.361328125, -43.6826171875, -42.00390625, -40.3251953125, -38.646484375, -36.9677734375, -35.2890625, -33.6103515625, -31.931640625, -30.2529296875, -28.57421875, -26.8955078125, -25.216796875, -23.5380859375, -21.859375, -20.1806640625, -18.501953125, -16.8232421875, -15.14453125, -13.4658203125, -11.787109375, -10.1083984375, -8.4296875, -6.7509765625, -5.072265625, -3.3935546875, -1.71484375, -0.0361328125, 1.642578125, 3.3212890625, 5.0, 6.6787109375, 8.357421875, 10.0361328125, 11.71484375, 13.3935546875, 15.072265625, 16.7509765625, 18.4296875, 20.1083984375, 21.787109375, 23.4658203125, 25.14453125, 26.8232421875, 28.501953125, 30.1806640625, 31.859375, 33.5380859375, 35.216796875, 36.8955078125, 38.57421875, 40.2529296875, 41.931640625, 43.6103515625, 45.2890625, 46.9677734375, 48.646484375, 50.3251953125, 52.00390625, 53.6826171875, 55.361328125, 57.0400390625, 58.71875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 11.0, 7.0, 6.0, 24.0, 13.0, 17.0, 25.0, 21.0, 25.0, 26.0, 42.0, 36.0, 45.0, 37.0, 44.0, 44.0, 42.0, 49.0, 59.0, 38.0, 53.0, 36.0, 43.0, 33.0, 37.0, 27.0, 25.0, 23.0, 23.0, 22.0, 10.0, 12.0, 9.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -38.80517578125, -37.3916015625, -35.97802734375, -34.564453125, -33.15087890625, -31.7373046875, -30.32373046875, -28.91015625, -27.49658203125, -26.0830078125, -24.66943359375, -23.255859375, -21.84228515625, -20.4287109375, -19.01513671875, -17.6015625, -16.18798828125, -14.7744140625, -13.36083984375, -11.947265625, -10.53369140625, -9.1201171875, -7.70654296875, -6.29296875, -4.87939453125, -3.4658203125, -2.05224609375, -0.638671875, 0.77490234375, 2.1884765625, 3.60205078125, 5.015625, 6.42919921875, 7.8427734375, 9.25634765625, 10.669921875, 12.08349609375, 13.4970703125, 14.91064453125, 16.32421875, 17.73779296875, 19.1513671875, 20.56494140625, 21.978515625, 23.39208984375, 24.8056640625, 26.21923828125, 27.6328125, 29.04638671875, 30.4599609375, 31.87353515625, 33.287109375, 34.70068359375, 36.1142578125, 37.52783203125, 38.94140625, 40.35498046875, 41.7685546875, 43.18212890625, 44.595703125, 46.00927734375, 47.4228515625, 48.83642578125, 50.25]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 14.0, 17.0, 20.0, 39.0, 73.0, 205.0, 1092.0, 17702.0, 893993.0, 131355.0, 3375.0, 448.0, 101.0, 49.0, 25.0, 16.0, 13.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.25, -79.7373046875, -77.224609375, -74.7119140625, -72.19921875, -69.6865234375, -67.173828125, -64.6611328125, -62.1484375, -59.6357421875, -57.123046875, -54.6103515625, -52.09765625, -49.5849609375, -47.072265625, -44.5595703125, -42.046875, -39.5341796875, -37.021484375, -34.5087890625, -31.99609375, -29.4833984375, -26.970703125, -24.4580078125, -21.9453125, -19.4326171875, -16.919921875, -14.4072265625, -11.89453125, -9.3818359375, -6.869140625, -4.3564453125, -1.84375, 0.6689453125, 3.181640625, 5.6943359375, 8.20703125, 10.7197265625, 13.232421875, 15.7451171875, 18.2578125, 20.7705078125, 23.283203125, 25.7958984375, 28.30859375, 30.8212890625, 33.333984375, 35.8466796875, 38.359375, 40.8720703125, 43.384765625, 45.8974609375, 48.41015625, 50.9228515625, 53.435546875, 55.9482421875, 58.4609375, 60.9736328125, 63.486328125, 65.9990234375, 68.51171875, 71.0244140625, 73.537109375, 76.0498046875, 78.5625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 6.0, 13.0, 10.0, 13.0, 25.0, 27.0, 44.0, 40.0, 49.0, 56.0, 81.0, 91.0, 111.0, 86.0, 67.0, 43.0, 50.0, 44.0, 29.0, 25.0, 18.0, 8.0, 12.0, 8.0, 3.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004119873046875, -0.003968477249145508, -0.0038170814514160156, -0.0036656856536865234, -0.0035142898559570312, -0.003362894058227539, -0.003211498260498047, -0.0030601024627685547, -0.0029087066650390625, -0.0027573108673095703, -0.002605915069580078, -0.002454519271850586, -0.0023031234741210938, -0.0021517276763916016, -0.0020003318786621094, -0.0018489360809326172, -0.001697540283203125, -0.0015461444854736328, -0.0013947486877441406, -0.0012433528900146484, -0.0010919570922851562, -0.0009405612945556641, -0.0007891654968261719, -0.0006377696990966797, -0.0004863739013671875, -0.0003349781036376953, -0.00018358230590820312, -3.218650817871094e-05, 0.00011920928955078125, 0.00027060508728027344, 0.0004220008850097656, 0.0005733966827392578, 0.00072479248046875, 0.0008761882781982422, 0.0010275840759277344, 0.0011789798736572266, 0.0013303756713867188, 0.001481771469116211, 0.0016331672668457031, 0.0017845630645751953, 0.0019359588623046875, 0.0020873546600341797, 0.002238750457763672, 0.002390146255493164, 0.0025415420532226562, 0.0026929378509521484, 0.0028443336486816406, 0.002995729446411133, 0.003147125244140625, 0.003298521041870117, 0.0034499168395996094, 0.0036013126373291016, 0.0037527084350585938, 0.003904104232788086, 0.004055500030517578, 0.00420689582824707, 0.0043582916259765625, 0.004509687423706055, 0.004661083221435547, 0.004812479019165039, 0.004963874816894531, 0.0051152706146240234, 0.005266666412353516, 0.005418062210083008, 0.0055694580078125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 5.0, 4.0, 11.0, 11.0, 22.0, 20.0, 40.0, 65.0, 130.0, 212.0, 513.0, 1267.0, 3715.0, 14455.0, 96760.0, 653102.0, 240841.0, 27933.0, 6134.0, 1947.0, 687.0, 331.0, 129.0, 84.0, 44.0, 22.0, 15.0, 14.0, 8.0, 11.0, 3.0, 4.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.609375, -29.504150390625, -28.39892578125, -27.293701171875, -26.1884765625, -25.083251953125, -23.97802734375, -22.872802734375, -21.767578125, -20.662353515625, -19.55712890625, -18.451904296875, -17.3466796875, -16.241455078125, -15.13623046875, -14.031005859375, -12.92578125, -11.820556640625, -10.71533203125, -9.610107421875, -8.5048828125, -7.399658203125, -6.29443359375, -5.189208984375, -4.083984375, -2.978759765625, -1.87353515625, -0.768310546875, 0.3369140625, 1.442138671875, 2.54736328125, 3.652587890625, 4.7578125, 5.863037109375, 6.96826171875, 8.073486328125, 9.1787109375, 10.283935546875, 11.38916015625, 12.494384765625, 13.599609375, 14.704833984375, 15.81005859375, 16.915283203125, 18.0205078125, 19.125732421875, 20.23095703125, 21.336181640625, 22.44140625, 23.546630859375, 24.65185546875, 25.757080078125, 26.8623046875, 27.967529296875, 29.07275390625, 30.177978515625, 31.283203125, 32.388427734375, 33.49365234375, 34.598876953125, 35.7041015625, 36.809326171875, 37.91455078125, 39.019775390625, 40.125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 11.0, 10.0, 20.0, 24.0, 63.0, 93.0, 116.0, 133.0, 136.0, 133.0, 95.0, 47.0, 51.0, 29.0, 12.0, 13.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.390625, -28.346923828125, -27.30322265625, -26.259521484375, -25.2158203125, -24.172119140625, -23.12841796875, -22.084716796875, -21.041015625, -19.997314453125, -18.95361328125, -17.909912109375, -16.8662109375, -15.822509765625, -14.77880859375, -13.735107421875, -12.69140625, -11.647705078125, -10.60400390625, -9.560302734375, -8.5166015625, -7.472900390625, -6.42919921875, -5.385498046875, -4.341796875, -3.298095703125, -2.25439453125, -1.210693359375, -0.1669921875, 0.876708984375, 1.92041015625, 2.964111328125, 4.0078125, 5.051513671875, 6.09521484375, 7.138916015625, 8.1826171875, 9.226318359375, 10.27001953125, 11.313720703125, 12.357421875, 13.401123046875, 14.44482421875, 15.488525390625, 16.5322265625, 17.575927734375, 18.61962890625, 19.663330078125, 20.70703125, 21.750732421875, 22.79443359375, 23.838134765625, 24.8818359375, 25.925537109375, 26.96923828125, 28.012939453125, 29.056640625, 30.100341796875, 31.14404296875, 32.187744140625, 33.2314453125, 34.275146484375, 35.31884765625, 36.362548828125, 37.40625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 7.0, 29.0, 111.0, 353.0, 370.0, 119.0, 20.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.05770874023438, -214.02015686035156, -178.98260498046875, -143.94505310058594, -108.90750122070312, -73.86994934082031, -38.8323974609375, -3.7948455810546875, 31.242706298828125, 66.28025817871094, 101.31781005859375, 136.35536193847656, 171.39291381835938, 206.4304656982422, 241.468017578125, 276.50555419921875, 311.5431213378906, 346.5806884765625, 381.61822509765625, 416.65576171875, 451.6933288574219, 486.73089599609375, 521.7684326171875, 556.8059692382812, 591.843505859375, 626.8810424804688, 661.9185791015625, 696.9561767578125, 731.9937133789062, 767.03125, 802.06884765625, 837.1063842773438, 872.1439208984375, 907.1814575195312, 942.218994140625, 977.256591796875, 1012.2941284179688, 1047.3316650390625, 1082.3692626953125, 1117.40673828125, 1152.4443359375, 1187.48193359375, 1222.5194091796875, 1257.5570068359375, 1292.594482421875, 1327.632080078125, 1362.669677734375, 1397.7071533203125, 1432.7447509765625, 1467.7823486328125, 1502.81982421875, 1537.857421875, 1572.89501953125, 1607.9324951171875, 1642.9700927734375, 1678.007568359375, 1713.045166015625, 1748.082763671875, 1783.1202392578125, 1818.1578369140625, 1853.1953125, 1888.23291015625, 1923.2705078125, 1958.3079833984375, 1993.3455810546875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 8.0, 6.0, 9.0, 9.0, 5.0, 14.0, 6.0, 12.0, 9.0, 26.0, 24.0, 30.0, 22.0, 27.0, 34.0, 36.0, 41.0, 37.0, 47.0, 43.0, 52.0, 49.0, 43.0, 41.0, 46.0, 44.0, 37.0, 36.0, 38.0, 30.0, 17.0, 21.0, 11.0, 14.0, 14.0, 17.0, 6.0, 14.0, 12.0, 3.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-222.6886749267578, -215.6664581298828, -208.6442413330078, -201.6220245361328, -194.5998077392578, -187.5775909423828, -180.55535888671875, -173.53314208984375, -166.51092529296875, -159.48870849609375, -152.46649169921875, -145.44427490234375, -138.42205810546875, -131.39984130859375, -124.37761688232422, -117.35540008544922, -110.33319091796875, -103.31097412109375, -96.28875732421875, -89.26654052734375, -82.24432373046875, -75.22210693359375, -68.19988250732422, -61.17766571044922, -54.15544891357422, -47.13323211669922, -40.11101531982422, -33.08879470825195, -26.066577911376953, -19.044361114501953, -12.022140502929688, -4.9999237060546875, 2.022308349609375, 9.044526100158691, 16.066743850708008, 23.08896255493164, 30.11117935180664, 37.13339614868164, 44.155616760253906, 51.177833557128906, 58.200050354003906, 65.2222671508789, 72.2444839477539, 79.26670837402344, 86.28892517089844, 93.31114196777344, 100.33335876464844, 107.35557556152344, 114.37779235839844, 121.40000915527344, 128.42222595214844, 135.44444274902344, 142.46665954589844, 149.48887634277344, 156.5111083984375, 163.5333251953125, 170.5555419921875, 177.5777587890625, 184.5999755859375, 191.6221923828125, 198.6444091796875, 205.6666259765625, 212.6888427734375, 219.7110595703125, 226.7332763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 8.0, 9.0, 13.0, 21.0, 22.0, 31.0, 38.0, 69.0, 89.0, 142.0, 153.0, 243.0, 403.0, 540.0, 948.0, 1575.0, 3070.0, 6191.0, 16092.0, 66717.0, 3891421.0, 163629.0, 25702.0, 8409.0, 3651.0, 1986.0, 1156.0, 608.0, 438.0, 266.0, 184.0, 131.0, 83.0, 69.0, 46.0, 28.0, 21.0, 13.0, 16.0, 15.0, 11.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-48.1875, -46.71337890625, -45.2392578125, -43.76513671875, -42.291015625, -40.81689453125, -39.3427734375, -37.86865234375, -36.39453125, -34.92041015625, -33.4462890625, -31.97216796875, -30.498046875, -29.02392578125, -27.5498046875, -26.07568359375, -24.6015625, -23.12744140625, -21.6533203125, -20.17919921875, -18.705078125, -17.23095703125, -15.7568359375, -14.28271484375, -12.80859375, -11.33447265625, -9.8603515625, -8.38623046875, -6.912109375, -5.43798828125, -3.9638671875, -2.48974609375, -1.015625, 0.45849609375, 1.9326171875, 3.40673828125, 4.880859375, 6.35498046875, 7.8291015625, 9.30322265625, 10.77734375, 12.25146484375, 13.7255859375, 15.19970703125, 16.673828125, 18.14794921875, 19.6220703125, 21.09619140625, 22.5703125, 24.04443359375, 25.5185546875, 26.99267578125, 28.466796875, 29.94091796875, 31.4150390625, 32.88916015625, 34.36328125, 35.83740234375, 37.3115234375, 38.78564453125, 40.259765625, 41.73388671875, 43.2080078125, 44.68212890625, 46.15625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 9.0, 2.0, 4.0, 16.0, 13.0, 17.0, 30.0, 26.0, 37.0, 31.0, 32.0, 44.0, 57.0, 53.0, 61.0, 53.0, 49.0, 57.0, 54.0, 56.0, 47.0, 38.0, 34.0, 35.0, 30.0, 29.0, 26.0, 8.0, 17.0, 8.0, 11.0, 4.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0701904296875, -9.726318359375, -9.3824462890625, -9.03857421875, -8.6947021484375, -8.350830078125, -8.0069580078125, -7.6630859375, -7.3192138671875, -6.975341796875, -6.6314697265625, -6.28759765625, -5.9437255859375, -5.599853515625, -5.2559814453125, -4.912109375, -4.5682373046875, -4.224365234375, -3.8804931640625, -3.53662109375, -3.1927490234375, -2.848876953125, -2.5050048828125, -2.1611328125, -1.8172607421875, -1.473388671875, -1.1295166015625, -0.78564453125, -0.4417724609375, -0.097900390625, 0.2459716796875, 0.58984375, 0.9337158203125, 1.277587890625, 1.6214599609375, 1.96533203125, 2.3092041015625, 2.653076171875, 2.9969482421875, 3.3408203125, 3.6846923828125, 4.028564453125, 4.3724365234375, 4.71630859375, 5.0601806640625, 5.404052734375, 5.7479248046875, 6.091796875, 6.4356689453125, 6.779541015625, 7.1234130859375, 7.46728515625, 7.8111572265625, 8.155029296875, 8.4989013671875, 8.8427734375, 9.1866455078125, 9.530517578125, 9.8743896484375, 10.21826171875, 10.5621337890625, 10.906005859375, 11.2498779296875, 11.59375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 6.0, 11.0, 18.0, 25.0, 41.0, 42.0, 70.0, 109.0, 149.0, 214.0, 335.0, 542.0, 896.0, 1565.0, 3238.0, 7489.0, 32374.0, 3946760.0, 174303.0, 15362.0, 5042.0, 2470.0, 1231.0, 696.0, 428.0, 281.0, 200.0, 104.0, 84.0, 53.0, 39.0, 27.0, 17.0, 21.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-111.9375, -108.89453125, -105.8515625, -102.80859375, -99.765625, -96.72265625, -93.6796875, -90.63671875, -87.59375, -84.55078125, -81.5078125, -78.46484375, -75.421875, -72.37890625, -69.3359375, -66.29296875, -63.25, -60.20703125, -57.1640625, -54.12109375, -51.078125, -48.03515625, -44.9921875, -41.94921875, -38.90625, -35.86328125, -32.8203125, -29.77734375, -26.734375, -23.69140625, -20.6484375, -17.60546875, -14.5625, -11.51953125, -8.4765625, -5.43359375, -2.390625, 0.65234375, 3.6953125, 6.73828125, 9.78125, 12.82421875, 15.8671875, 18.91015625, 21.953125, 24.99609375, 28.0390625, 31.08203125, 34.125, 37.16796875, 40.2109375, 43.25390625, 46.296875, 49.33984375, 52.3828125, 55.42578125, 58.46875, 61.51171875, 64.5546875, 67.59765625, 70.640625, 73.68359375, 76.7265625, 79.76953125, 82.8125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 9.0, 15.0, 37.0, 85.0, 439.0, 3191.0, 152.0, 54.0, 32.0, 9.0, 7.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.28125, -23.6627197265625, -23.044189453125, -22.4256591796875, -21.80712890625, -21.1885986328125, -20.570068359375, -19.9515380859375, -19.3330078125, -18.7144775390625, -18.095947265625, -17.4774169921875, -16.85888671875, -16.2403564453125, -15.621826171875, -15.0032958984375, -14.384765625, -13.7662353515625, -13.147705078125, -12.5291748046875, -11.91064453125, -11.2921142578125, -10.673583984375, -10.0550537109375, -9.4365234375, -8.8179931640625, -8.199462890625, -7.5809326171875, -6.96240234375, -6.3438720703125, -5.725341796875, -5.1068115234375, -4.48828125, -3.8697509765625, -3.251220703125, -2.6326904296875, -2.01416015625, -1.3956298828125, -0.777099609375, -0.1585693359375, 0.4599609375, 1.0784912109375, 1.697021484375, 2.3155517578125, 2.93408203125, 3.5526123046875, 4.171142578125, 4.7896728515625, 5.408203125, 6.0267333984375, 6.645263671875, 7.2637939453125, 7.88232421875, 8.5008544921875, 9.119384765625, 9.7379150390625, 10.3564453125, 10.9749755859375, 11.593505859375, 12.2120361328125, 12.83056640625, 13.4490966796875, 14.067626953125, 14.6861572265625, 15.3046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 3.0, 3.0, 5.0, 7.0, 9.0, 14.0, 23.0, 34.0, 35.0, 46.0, 54.0, 71.0, 80.0, 77.0, 97.0, 90.0, 79.0, 72.0, 66.0, 30.0, 32.0, 21.0, 17.0, 7.0, 5.0, 11.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.845252990722656, -47.290611267089844, -45.73596954345703, -44.18132781982422, -42.626686096191406, -41.072044372558594, -39.51740264892578, -37.96276092529297, -36.408119201660156, -34.853477478027344, -33.29883575439453, -31.74419403076172, -30.189552307128906, -28.634910583496094, -27.08026885986328, -25.52562713623047, -23.970985412597656, -22.416343688964844, -20.86170196533203, -19.30706024169922, -17.752418518066406, -16.197776794433594, -14.643135070800781, -13.088493347167969, -11.533851623535156, -9.979209899902344, -8.424568176269531, -6.869926452636719, -5.315284729003906, -3.7606430053710938, -2.2060012817382812, -0.6513595581054688, 0.9032821655273438, 2.4579238891601562, 4.012565612792969, 5.567207336425781, 7.121849060058594, 8.676490783691406, 10.231132507324219, 11.785774230957031, 13.340415954589844, 14.895057678222656, 16.44969940185547, 18.00434112548828, 19.558982849121094, 21.113624572753906, 22.66826629638672, 24.22290802001953, 25.777549743652344, 27.332191467285156, 28.88683319091797, 30.44147491455078, 31.996116638183594, 33.550758361816406, 35.10540008544922, 36.66004180908203, 38.214683532714844, 39.769325256347656, 41.32396697998047, 42.87860870361328, 44.433250427246094, 45.987892150878906, 47.54253387451172, 49.09717559814453, 50.651817321777344]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 2.0, 9.0, 7.0, 17.0, 19.0, 15.0, 18.0, 23.0, 23.0, 34.0, 35.0, 33.0, 42.0, 37.0, 41.0, 46.0, 41.0, 36.0, 57.0, 40.0, 35.0, 44.0, 33.0, 32.0, 44.0, 28.0, 21.0, 34.0, 22.0, 24.0, 19.0, 14.0, 11.0, 7.0, 14.0, 7.0, 6.0, 4.0, 7.0, 1.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.44331359863281, -32.43024826049805, -31.417186737060547, -30.404123306274414, -29.39105987548828, -28.377994537353516, -27.364931106567383, -26.35186767578125, -25.338804244995117, -24.325740814208984, -23.31267738342285, -22.29961395263672, -21.286548614501953, -20.273487091064453, -19.260421752929688, -18.247358322143555, -17.234294891357422, -16.22123146057129, -15.208168029785156, -14.195103645324707, -13.182040214538574, -12.168976783752441, -11.155912399291992, -10.14284896850586, -9.129785537719727, -8.116722106933594, -7.103658199310303, -6.090594291687012, -5.077530860900879, -4.064467430114746, -3.051403522491455, -2.038339614868164, -1.025278091430664, -0.012214422225952148, 1.0008492469787598, 2.0139129161834717, 3.0269765853881836, 4.040040016174316, 5.053103923797607, 6.066167831420898, 7.079231262207031, 8.092294692993164, 9.105358123779297, 10.118422508239746, 11.131485939025879, 12.144549369812012, 13.157613754272461, 14.170677185058594, 15.183740615844727, 16.19680404663086, 17.209867477416992, 18.222930908203125, 19.23599624633789, 20.24905776977539, 21.262123107910156, 22.27518653869629, 23.288249969482422, 24.301313400268555, 25.314376831054688, 26.32744026184082, 27.340503692626953, 28.35356903076172, 29.36663246154785, 30.379695892333984, 31.392759323120117]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 6.0, 10.0, 7.0, 10.0, 19.0, 17.0, 21.0, 54.0, 63.0, 111.0, 189.0, 384.0, 715.0, 1520.0, 3047.0, 7063.0, 16051.0, 38311.0, 90190.0, 198487.0, 299391.0, 216272.0, 101196.0, 42568.0, 18012.0, 7930.0, 3448.0, 1672.0, 807.0, 395.0, 217.0, 133.0, 82.0, 58.0, 30.0, 17.0, 10.0, 11.0, 14.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.78125, -26.95361328125, -26.1259765625, -25.29833984375, -24.470703125, -23.64306640625, -22.8154296875, -21.98779296875, -21.16015625, -20.33251953125, -19.5048828125, -18.67724609375, -17.849609375, -17.02197265625, -16.1943359375, -15.36669921875, -14.5390625, -13.71142578125, -12.8837890625, -12.05615234375, -11.228515625, -10.40087890625, -9.5732421875, -8.74560546875, -7.91796875, -7.09033203125, -6.2626953125, -5.43505859375, -4.607421875, -3.77978515625, -2.9521484375, -2.12451171875, -1.296875, -0.46923828125, 0.3583984375, 1.18603515625, 2.013671875, 2.84130859375, 3.6689453125, 4.49658203125, 5.32421875, 6.15185546875, 6.9794921875, 7.80712890625, 8.634765625, 9.46240234375, 10.2900390625, 11.11767578125, 11.9453125, 12.77294921875, 13.6005859375, 14.42822265625, 15.255859375, 16.08349609375, 16.9111328125, 17.73876953125, 18.56640625, 19.39404296875, 20.2216796875, 21.04931640625, 21.876953125, 22.70458984375, 23.5322265625, 24.35986328125, 25.1875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 10.0, 3.0, 6.0, 10.0, 18.0, 14.0, 8.0, 20.0, 28.0, 19.0, 29.0, 26.0, 39.0, 50.0, 40.0, 37.0, 50.0, 46.0, 46.0, 50.0, 38.0, 33.0, 44.0, 51.0, 40.0, 41.0, 30.0, 26.0, 26.0, 20.0, 25.0, 15.0, 11.0, 16.0, 7.0, 8.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.140625, -10.7989501953125, -10.457275390625, -10.1156005859375, -9.77392578125, -9.4322509765625, -9.090576171875, -8.7489013671875, -8.4072265625, -8.0655517578125, -7.723876953125, -7.3822021484375, -7.04052734375, -6.6988525390625, -6.357177734375, -6.0155029296875, -5.673828125, -5.3321533203125, -4.990478515625, -4.6488037109375, -4.30712890625, -3.9654541015625, -3.623779296875, -3.2821044921875, -2.9404296875, -2.5987548828125, -2.257080078125, -1.9154052734375, -1.57373046875, -1.2320556640625, -0.890380859375, -0.5487060546875, -0.20703125, 0.1346435546875, 0.476318359375, 0.8179931640625, 1.15966796875, 1.5013427734375, 1.843017578125, 2.1846923828125, 2.5263671875, 2.8680419921875, 3.209716796875, 3.5513916015625, 3.89306640625, 4.2347412109375, 4.576416015625, 4.9180908203125, 5.259765625, 5.6014404296875, 5.943115234375, 6.2847900390625, 6.62646484375, 6.9681396484375, 7.309814453125, 7.6514892578125, 7.9931640625, 8.3348388671875, 8.676513671875, 9.0181884765625, 9.35986328125, 9.7015380859375, 10.043212890625, 10.3848876953125, 10.7265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 11.0, 20.0, 18.0, 16.0, 36.0, 44.0, 47.0, 87.0, 117.0, 201.0, 309.0, 511.0, 898.0, 1882.0, 5285.0, 20928.0, 111081.0, 535714.0, 301739.0, 51881.0, 11157.0, 3371.0, 1320.0, 675.0, 391.0, 274.0, 158.0, 110.0, 70.0, 50.0, 32.0, 27.0, 25.0, 18.0, 12.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.8125, -46.25927734375, -44.7060546875, -43.15283203125, -41.599609375, -40.04638671875, -38.4931640625, -36.93994140625, -35.38671875, -33.83349609375, -32.2802734375, -30.72705078125, -29.173828125, -27.62060546875, -26.0673828125, -24.51416015625, -22.9609375, -21.40771484375, -19.8544921875, -18.30126953125, -16.748046875, -15.19482421875, -13.6416015625, -12.08837890625, -10.53515625, -8.98193359375, -7.4287109375, -5.87548828125, -4.322265625, -2.76904296875, -1.2158203125, 0.33740234375, 1.890625, 3.44384765625, 4.9970703125, 6.55029296875, 8.103515625, 9.65673828125, 11.2099609375, 12.76318359375, 14.31640625, 15.86962890625, 17.4228515625, 18.97607421875, 20.529296875, 22.08251953125, 23.6357421875, 25.18896484375, 26.7421875, 28.29541015625, 29.8486328125, 31.40185546875, 32.955078125, 34.50830078125, 36.0615234375, 37.61474609375, 39.16796875, 40.72119140625, 42.2744140625, 43.82763671875, 45.380859375, 46.93408203125, 48.4873046875, 50.04052734375, 51.59375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 13.0, 8.0, 10.0, 11.0, 17.0, 20.0, 13.0, 25.0, 18.0, 21.0, 33.0, 35.0, 42.0, 47.0, 44.0, 44.0, 44.0, 29.0, 41.0, 44.0, 37.0, 46.0, 45.0, 28.0, 39.0, 26.0, 20.0, 19.0, 23.0, 24.0, 14.0, 17.0, 13.0, 12.0, 7.0, 12.0, 5.0, 9.0, 7.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-53.125, -51.4990234375, -49.873046875, -48.2470703125, -46.62109375, -44.9951171875, -43.369140625, -41.7431640625, -40.1171875, -38.4912109375, -36.865234375, -35.2392578125, -33.61328125, -31.9873046875, -30.361328125, -28.7353515625, -27.109375, -25.4833984375, -23.857421875, -22.2314453125, -20.60546875, -18.9794921875, -17.353515625, -15.7275390625, -14.1015625, -12.4755859375, -10.849609375, -9.2236328125, -7.59765625, -5.9716796875, -4.345703125, -2.7197265625, -1.09375, 0.5322265625, 2.158203125, 3.7841796875, 5.41015625, 7.0361328125, 8.662109375, 10.2880859375, 11.9140625, 13.5400390625, 15.166015625, 16.7919921875, 18.41796875, 20.0439453125, 21.669921875, 23.2958984375, 24.921875, 26.5478515625, 28.173828125, 29.7998046875, 31.42578125, 33.0517578125, 34.677734375, 36.3037109375, 37.9296875, 39.5556640625, 41.181640625, 42.8076171875, 44.43359375, 46.0595703125, 47.685546875, 49.3115234375, 50.9375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 14.0, 8.0, 7.0, 11.0, 14.0, 21.0, 22.0, 46.0, 64.0, 94.0, 116.0, 167.0, 299.0, 507.0, 994.0, 2096.0, 5164.0, 17974.0, 87761.0, 493517.0, 357726.0, 60521.0, 13458.0, 4130.0, 1719.0, 854.0, 449.0, 253.0, 160.0, 118.0, 79.0, 50.0, 40.0, 30.0, 16.0, 16.0, 8.0, 7.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.765625, -30.855224609375, -29.94482421875, -29.034423828125, -28.1240234375, -27.213623046875, -26.30322265625, -25.392822265625, -24.482421875, -23.572021484375, -22.66162109375, -21.751220703125, -20.8408203125, -19.930419921875, -19.02001953125, -18.109619140625, -17.19921875, -16.288818359375, -15.37841796875, -14.468017578125, -13.5576171875, -12.647216796875, -11.73681640625, -10.826416015625, -9.916015625, -9.005615234375, -8.09521484375, -7.184814453125, -6.2744140625, -5.364013671875, -4.45361328125, -3.543212890625, -2.6328125, -1.722412109375, -0.81201171875, 0.098388671875, 1.0087890625, 1.919189453125, 2.82958984375, 3.739990234375, 4.650390625, 5.560791015625, 6.47119140625, 7.381591796875, 8.2919921875, 9.202392578125, 10.11279296875, 11.023193359375, 11.93359375, 12.843994140625, 13.75439453125, 14.664794921875, 15.5751953125, 16.485595703125, 17.39599609375, 18.306396484375, 19.216796875, 20.127197265625, 21.03759765625, 21.947998046875, 22.8583984375, 23.768798828125, 24.67919921875, 25.589599609375, 26.5]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 17.0, 31.0, 50.0, 63.0, 100.0, 163.0, 158.0, 161.0, 104.0, 64.0, 33.0, 20.0, 16.0, 7.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038547515869140625, -0.003567427396774292, -0.0032801032066345215, -0.002992779016494751, -0.0027054548263549805, -0.00241813063621521, -0.0021308064460754395, -0.001843482255935669, -0.0015561580657958984, -0.001268833875656128, -0.0009815096855163574, -0.0006941854953765869, -0.0004068613052368164, -0.0001195371150970459, 0.0001677870750427246, 0.0004551112651824951, 0.0007424354553222656, 0.0010297596454620361, 0.0013170838356018066, 0.0016044080257415771, 0.0018917322158813477, 0.002179056406021118, 0.0024663805961608887, 0.002753704786300659, 0.0030410289764404297, 0.0033283531665802, 0.0036156773567199707, 0.003903001546859741, 0.004190325736999512, 0.004477649927139282, 0.004764974117279053, 0.005052298307418823, 0.005339622497558594, 0.005626946687698364, 0.005914270877838135, 0.006201595067977905, 0.006488919258117676, 0.006776243448257446, 0.007063567638397217, 0.007350891828536987, 0.007638216018676758, 0.007925540208816528, 0.008212864398956299, 0.00850018858909607, 0.00878751277923584, 0.00907483696937561, 0.00936216115951538, 0.009649485349655151, 0.009936809539794922, 0.010224133729934692, 0.010511457920074463, 0.010798782110214233, 0.011086106300354004, 0.011373430490493774, 0.011660754680633545, 0.011948078870773315, 0.012235403060913086, 0.012522727251052856, 0.012810051441192627, 0.013097375631332397, 0.013384699821472168, 0.013672024011611938, 0.013959348201751709, 0.01424667239189148, 0.01453399658203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 8.0, 11.0, 23.0, 27.0, 56.0, 93.0, 158.0, 417.0, 1338.0, 5796.0, 54647.0, 755532.0, 213199.0, 13681.0, 2390.0, 682.0, 243.0, 125.0, 54.0, 25.0, 16.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -36.876953125, -35.25390625, -33.630859375, -32.0078125, -30.384765625, -28.76171875, -27.138671875, -25.515625, -23.892578125, -22.26953125, -20.646484375, -19.0234375, -17.400390625, -15.77734375, -14.154296875, -12.53125, -10.908203125, -9.28515625, -7.662109375, -6.0390625, -4.416015625, -2.79296875, -1.169921875, 0.453125, 2.076171875, 3.69921875, 5.322265625, 6.9453125, 8.568359375, 10.19140625, 11.814453125, 13.4375, 15.060546875, 16.68359375, 18.306640625, 19.9296875, 21.552734375, 23.17578125, 24.798828125, 26.421875, 28.044921875, 29.66796875, 31.291015625, 32.9140625, 34.537109375, 36.16015625, 37.783203125, 39.40625, 41.029296875, 42.65234375, 44.275390625, 45.8984375, 47.521484375, 49.14453125, 50.767578125, 52.390625, 54.013671875, 55.63671875, 57.259765625, 58.8828125, 60.505859375, 62.12890625, 63.751953125, 65.375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 9.0, 17.0, 22.0, 23.0, 31.0, 47.0, 60.0, 75.0, 101.0, 107.0, 98.0, 87.0, 76.0, 72.0, 62.0, 23.0, 17.0, 21.0, 13.0, 5.0, 10.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.515625, -22.552001953125, -21.58837890625, -20.624755859375, -19.6611328125, -18.697509765625, -17.73388671875, -16.770263671875, -15.806640625, -14.843017578125, -13.87939453125, -12.915771484375, -11.9521484375, -10.988525390625, -10.02490234375, -9.061279296875, -8.09765625, -7.134033203125, -6.17041015625, -5.206787109375, -4.2431640625, -3.279541015625, -2.31591796875, -1.352294921875, -0.388671875, 0.574951171875, 1.53857421875, 2.502197265625, 3.4658203125, 4.429443359375, 5.39306640625, 6.356689453125, 7.3203125, 8.283935546875, 9.24755859375, 10.211181640625, 11.1748046875, 12.138427734375, 13.10205078125, 14.065673828125, 15.029296875, 15.992919921875, 16.95654296875, 17.920166015625, 18.8837890625, 19.847412109375, 20.81103515625, 21.774658203125, 22.73828125, 23.701904296875, 24.66552734375, 25.629150390625, 26.5927734375, 27.556396484375, 28.52001953125, 29.483642578125, 30.447265625, 31.410888671875, 32.37451171875, 33.338134765625, 34.3017578125, 35.265380859375, 36.22900390625, 37.192626953125, 38.15625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 23.0, 78.0, 147.0, 215.0, 246.0, 185.0, 64.0, 28.0, 13.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-492.8465576171875, -466.9833679199219, -441.12017822265625, -415.25701904296875, -389.3938293457031, -363.5306396484375, -337.6674499511719, -311.80426025390625, -285.94110107421875, -260.0779113769531, -234.21473693847656, -208.35154724121094, -182.48837280273438, -156.62518310546875, -130.76199340820312, -104.89881896972656, -79.03561401367188, -53.17243194580078, -27.309246063232422, -1.4460601806640625, 24.41712188720703, 50.280303955078125, 76.14349365234375, 102.00666809082031, 127.86985778808594, 153.73304748535156, 179.59622192382812, 205.45941162109375, 231.32260131835938, 257.185791015625, 283.0489501953125, 308.9121398925781, 334.77532958984375, 360.6385192871094, 386.501708984375, 412.3648681640625, 438.2280578613281, 464.09124755859375, 489.9544372558594, 515.817626953125, 541.6807861328125, 567.5439453125, 593.4071655273438, 619.2703247070312, 645.133544921875, 670.9967041015625, 696.85986328125, 722.7230834960938, 748.5863037109375, 774.449462890625, 800.3126831054688, 826.1758422851562, 852.0390625, 877.9022216796875, 903.765380859375, 929.6286010742188, 955.4917602539062, 981.3549194335938, 1007.2181396484375, 1033.081298828125, 1058.9444580078125, 1084.8076171875, 1110.6708984375, 1136.5340576171875, 1162.397216796875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 14.0, 9.0, 13.0, 10.0, 10.0, 20.0, 29.0, 23.0, 28.0, 34.0, 31.0, 34.0, 29.0, 45.0, 57.0, 44.0, 58.0, 42.0, 55.0, 55.0, 35.0, 39.0, 35.0, 35.0, 30.0, 31.0, 22.0, 19.0, 22.0, 11.0, 12.0, 16.0, 8.0, 1.0, 10.0, 10.0, 2.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-319.8168640136719, -310.1666259765625, -300.5163879394531, -290.8661193847656, -281.21588134765625, -271.5656433105469, -261.9154052734375, -252.26516723632812, -242.6149139404297, -232.9646759033203, -223.31442260742188, -213.6641845703125, -204.01394653320312, -194.3636932373047, -184.7134552001953, -175.06320190429688, -165.4129638671875, -155.76272583007812, -146.1124725341797, -136.4622344970703, -126.8119888305664, -117.1617431640625, -107.51150512695312, -97.86125946044922, -88.21101379394531, -78.5607681274414, -68.9105224609375, -59.260284423828125, -49.61003875732422, -39.95979309082031, -30.309551239013672, -20.65930938720703, -11.009033203125, -1.3587894439697266, 8.291454315185547, 17.94169807434082, 27.591941833496094, 37.2421875, 46.89242935180664, 56.54267120361328, 66.19291687011719, 75.8431625366211, 85.493408203125, 95.14364624023438, 104.79389190673828, 114.44413757324219, 124.09437561035156, 133.74462890625, 143.39486694335938, 153.04510498046875, 162.6953582763672, 172.34559631347656, 181.995849609375, 191.64608764648438, 201.29632568359375, 210.94656372070312, 220.59681701660156, 230.24705505371094, 239.89730834960938, 249.54754638671875, 259.1977844238281, 268.8480224609375, 278.498291015625, 288.1485290527344, 297.79876708984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 9.0, 8.0, 12.0, 19.0, 31.0, 41.0, 61.0, 85.0, 182.0, 280.0, 457.0, 704.0, 1273.0, 2368.0, 5206.0, 12895.0, 44610.0, 3607607.0, 460871.0, 36902.0, 11067.0, 4517.0, 2115.0, 1086.0, 695.0, 394.0, 260.0, 176.0, 119.0, 84.0, 60.0, 30.0, 24.0, 15.0, 7.0, 10.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.375, -46.64306640625, -44.9111328125, -43.17919921875, -41.447265625, -39.71533203125, -37.9833984375, -36.25146484375, -34.51953125, -32.78759765625, -31.0556640625, -29.32373046875, -27.591796875, -25.85986328125, -24.1279296875, -22.39599609375, -20.6640625, -18.93212890625, -17.2001953125, -15.46826171875, -13.736328125, -12.00439453125, -10.2724609375, -8.54052734375, -6.80859375, -5.07666015625, -3.3447265625, -1.61279296875, 0.119140625, 1.85107421875, 3.5830078125, 5.31494140625, 7.046875, 8.77880859375, 10.5107421875, 12.24267578125, 13.974609375, 15.70654296875, 17.4384765625, 19.17041015625, 20.90234375, 22.63427734375, 24.3662109375, 26.09814453125, 27.830078125, 29.56201171875, 31.2939453125, 33.02587890625, 34.7578125, 36.48974609375, 38.2216796875, 39.95361328125, 41.685546875, 43.41748046875, 45.1494140625, 46.88134765625, 48.61328125, 50.34521484375, 52.0771484375, 53.80908203125, 55.541015625, 57.27294921875, 59.0048828125, 60.73681640625, 62.46875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 14.0, 15.0, 21.0, 26.0, 18.0, 31.0, 33.0, 37.0, 52.0, 60.0, 52.0, 64.0, 64.0, 64.0, 81.0, 59.0, 46.0, 58.0, 48.0, 27.0, 30.0, 19.0, 14.0, 15.0, 19.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.84375, -17.3697509765625, -16.895751953125, -16.4217529296875, -15.94775390625, -15.4737548828125, -14.999755859375, -14.5257568359375, -14.0517578125, -13.5777587890625, -13.103759765625, -12.6297607421875, -12.15576171875, -11.6817626953125, -11.207763671875, -10.7337646484375, -10.259765625, -9.7857666015625, -9.311767578125, -8.8377685546875, -8.36376953125, -7.8897705078125, -7.415771484375, -6.9417724609375, -6.4677734375, -5.9937744140625, -5.519775390625, -5.0457763671875, -4.57177734375, -4.0977783203125, -3.623779296875, -3.1497802734375, -2.67578125, -2.2017822265625, -1.727783203125, -1.2537841796875, -0.77978515625, -0.3057861328125, 0.168212890625, 0.6422119140625, 1.1162109375, 1.5902099609375, 2.064208984375, 2.5382080078125, 3.01220703125, 3.4862060546875, 3.960205078125, 4.4342041015625, 4.908203125, 5.3822021484375, 5.856201171875, 6.3302001953125, 6.80419921875, 7.2781982421875, 7.752197265625, 8.2261962890625, 8.7001953125, 9.1741943359375, 9.648193359375, 10.1221923828125, 10.59619140625, 11.0701904296875, 11.544189453125, 12.0181884765625, 12.4921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 15.0, 18.0, 24.0, 29.0, 40.0, 52.0, 95.0, 101.0, 155.0, 290.0, 474.0, 772.0, 1440.0, 2915.0, 6860.0, 20913.0, 119885.0, 3913240.0, 95960.0, 18594.0, 6291.0, 2668.0, 1391.0, 767.0, 406.0, 256.0, 186.0, 124.0, 96.0, 54.0, 37.0, 33.0, 18.0, 15.0, 18.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 3.0], "bins": [-88.25, -86.01318359375, -83.7763671875, -81.53955078125, -79.302734375, -77.06591796875, -74.8291015625, -72.59228515625, -70.35546875, -68.11865234375, -65.8818359375, -63.64501953125, -61.408203125, -59.17138671875, -56.9345703125, -54.69775390625, -52.4609375, -50.22412109375, -47.9873046875, -45.75048828125, -43.513671875, -41.27685546875, -39.0400390625, -36.80322265625, -34.56640625, -32.32958984375, -30.0927734375, -27.85595703125, -25.619140625, -23.38232421875, -21.1455078125, -18.90869140625, -16.671875, -14.43505859375, -12.1982421875, -9.96142578125, -7.724609375, -5.48779296875, -3.2509765625, -1.01416015625, 1.22265625, 3.45947265625, 5.6962890625, 7.93310546875, 10.169921875, 12.40673828125, 14.6435546875, 16.88037109375, 19.1171875, 21.35400390625, 23.5908203125, 25.82763671875, 28.064453125, 30.30126953125, 32.5380859375, 34.77490234375, 37.01171875, 39.24853515625, 41.4853515625, 43.72216796875, 45.958984375, 48.19580078125, 50.4326171875, 52.66943359375, 54.90625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 5.0, 9.0, 23.0, 26.0, 34.0, 77.0, 227.0, 3019.0, 406.0, 96.0, 60.0, 33.0, 10.0, 10.0, 4.0, 11.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -20.09228515625, -19.5126953125, -18.93310546875, -18.353515625, -17.77392578125, -17.1943359375, -16.61474609375, -16.03515625, -15.45556640625, -14.8759765625, -14.29638671875, -13.716796875, -13.13720703125, -12.5576171875, -11.97802734375, -11.3984375, -10.81884765625, -10.2392578125, -9.65966796875, -9.080078125, -8.50048828125, -7.9208984375, -7.34130859375, -6.76171875, -6.18212890625, -5.6025390625, -5.02294921875, -4.443359375, -3.86376953125, -3.2841796875, -2.70458984375, -2.125, -1.54541015625, -0.9658203125, -0.38623046875, 0.193359375, 0.77294921875, 1.3525390625, 1.93212890625, 2.51171875, 3.09130859375, 3.6708984375, 4.25048828125, 4.830078125, 5.40966796875, 5.9892578125, 6.56884765625, 7.1484375, 7.72802734375, 8.3076171875, 8.88720703125, 9.466796875, 10.04638671875, 10.6259765625, 11.20556640625, 11.78515625, 12.36474609375, 12.9443359375, 13.52392578125, 14.103515625, 14.68310546875, 15.2626953125, 15.84228515625, 16.421875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 7.0, 14.0, 22.0, 44.0, 49.0, 81.0, 87.0, 121.0, 125.0, 128.0, 101.0, 80.0, 44.0, 30.0, 14.0, 16.0, 10.0, 3.0, 11.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.79011535644531, -91.06727600097656, -88.34444427490234, -85.62161254882812, -82.89877319335938, -80.17593383789062, -77.4531021118164, -74.73027038574219, -72.00743103027344, -69.28459167480469, -66.56175994873047, -63.838924407958984, -61.1160888671875, -58.393253326416016, -55.67041778564453, -52.94758224487305, -50.22474670410156, -47.50191116333008, -44.779075622558594, -42.05624008178711, -39.333404541015625, -36.61056900024414, -33.887733459472656, -31.164897918701172, -28.442062377929688, -25.719226837158203, -22.99639129638672, -20.273555755615234, -17.55072021484375, -14.827884674072266, -12.105049133300781, -9.382213592529297, -6.6593780517578125, -3.936542510986328, -1.2137069702148438, 1.5091285705566406, 4.231964111328125, 6.954799652099609, 9.677635192871094, 12.400470733642578, 15.123306274414062, 17.846141815185547, 20.56897735595703, 23.291812896728516, 26.0146484375, 28.737483978271484, 31.46031951904297, 34.18315505981445, 36.90599060058594, 39.62882614135742, 42.351661682128906, 45.07449722290039, 47.797332763671875, 50.52016830444336, 53.243003845214844, 55.96583938598633, 58.68867492675781, 61.4115104675293, 64.13434600830078, 66.857177734375, 69.58001708984375, 72.3028564453125, 75.02568817138672, 77.74851989746094, 80.47135925292969]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 11.0, 14.0, 18.0, 13.0, 14.0, 18.0, 23.0, 24.0, 25.0, 21.0, 42.0, 32.0, 38.0, 40.0, 25.0, 57.0, 50.0, 36.0, 45.0, 44.0, 45.0, 46.0, 32.0, 32.0, 28.0, 31.0, 26.0, 14.0, 26.0, 21.0, 21.0, 12.0, 7.0, 12.0, 7.0, 8.0, 5.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-39.73627853393555, -38.607452392578125, -37.47863006591797, -36.34980392456055, -35.220977783203125, -34.09215545654297, -32.96332931518555, -31.834505081176758, -30.70568084716797, -29.57685661315918, -28.44803237915039, -27.31920623779297, -26.19038200378418, -25.06155776977539, -23.93273162841797, -22.80390739440918, -21.67508316040039, -20.5462589263916, -19.417434692382812, -18.28860855102539, -17.1597843170166, -16.030960083007812, -14.902134895324707, -13.773309707641602, -12.644485473632812, -11.515661239624023, -10.386836051940918, -9.258010864257812, -8.129186630249023, -7.000361919403076, -5.871537208557129, -4.742712497711182, -3.6138916015625, -2.4850668907165527, -1.3562421798706055, -0.2274174690246582, 0.9014072418212891, 2.0302319526672363, 3.1590566635131836, 4.287881374359131, 5.416706085205078, 6.545530796051025, 7.674355506896973, 8.803180694580078, 9.932004928588867, 11.060829162597656, 12.189654350280762, 13.318479537963867, 14.447303771972656, 15.576128005981445, 16.704952239990234, 17.833778381347656, 18.962602615356445, 20.091426849365234, 21.220252990722656, 22.349077224731445, 23.477901458740234, 24.606725692749023, 25.735549926757812, 26.864376068115234, 27.993200302124023, 29.122024536132812, 30.250850677490234, 31.379674911499023, 32.50849914550781]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 6.0, 14.0, 18.0, 27.0, 37.0, 65.0, 93.0, 154.0, 255.0, 475.0, 729.0, 1401.0, 2713.0, 5529.0, 11463.0, 26688.0, 65846.0, 167271.0, 327997.0, 255002.0, 106532.0, 41967.0, 17881.0, 7953.0, 3960.0, 1984.0, 998.0, 611.0, 340.0, 206.0, 121.0, 65.0, 51.0, 36.0, 13.0, 17.0, 8.0, 7.0, 7.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-30.140625, -29.2734375, -28.40625, -27.5390625, -26.671875, -25.8046875, -24.9375, -24.0703125, -23.203125, -22.3359375, -21.46875, -20.6015625, -19.734375, -18.8671875, -18.0, -17.1328125, -16.265625, -15.3984375, -14.53125, -13.6640625, -12.796875, -11.9296875, -11.0625, -10.1953125, -9.328125, -8.4609375, -7.59375, -6.7265625, -5.859375, -4.9921875, -4.125, -3.2578125, -2.390625, -1.5234375, -0.65625, 0.2109375, 1.078125, 1.9453125, 2.8125, 3.6796875, 4.546875, 5.4140625, 6.28125, 7.1484375, 8.015625, 8.8828125, 9.75, 10.6171875, 11.484375, 12.3515625, 13.21875, 14.0859375, 14.953125, 15.8203125, 16.6875, 17.5546875, 18.421875, 19.2890625, 20.15625, 21.0234375, 21.890625, 22.7578125, 23.625, 24.4921875, 25.359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 12.0, 8.0, 10.0, 14.0, 16.0, 28.0, 37.0, 39.0, 34.0, 26.0, 43.0, 68.0, 70.0, 59.0, 59.0, 49.0, 48.0, 62.0, 46.0, 53.0, 39.0, 33.0, 35.0, 24.0, 20.0, 9.0, 14.0, 6.0, 5.0, 10.0, 3.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.375, -17.8966064453125, -17.418212890625, -16.9398193359375, -16.46142578125, -15.9830322265625, -15.504638671875, -15.0262451171875, -14.5478515625, -14.0694580078125, -13.591064453125, -13.1126708984375, -12.63427734375, -12.1558837890625, -11.677490234375, -11.1990966796875, -10.720703125, -10.2423095703125, -9.763916015625, -9.2855224609375, -8.80712890625, -8.3287353515625, -7.850341796875, -7.3719482421875, -6.8935546875, -6.4151611328125, -5.936767578125, -5.4583740234375, -4.97998046875, -4.5015869140625, -4.023193359375, -3.5447998046875, -3.06640625, -2.5880126953125, -2.109619140625, -1.6312255859375, -1.15283203125, -0.6744384765625, -0.196044921875, 0.2823486328125, 0.7607421875, 1.2391357421875, 1.717529296875, 2.1959228515625, 2.67431640625, 3.1527099609375, 3.631103515625, 4.1094970703125, 4.587890625, 5.0662841796875, 5.544677734375, 6.0230712890625, 6.50146484375, 6.9798583984375, 7.458251953125, 7.9366455078125, 8.4150390625, 8.8934326171875, 9.371826171875, 9.8502197265625, 10.32861328125, 10.8070068359375, 11.285400390625, 11.7637939453125, 12.2421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 10.0, 16.0, 19.0, 38.0, 50.0, 84.0, 134.0, 275.0, 563.0, 1357.0, 5543.0, 83427.0, 888916.0, 60901.0, 4823.0, 1254.0, 510.0, 265.0, 142.0, 91.0, 43.0, 23.0, 19.0, 12.0, 7.0, 5.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-112.25, -108.9921875, -105.734375, -102.4765625, -99.21875, -95.9609375, -92.703125, -89.4453125, -86.1875, -82.9296875, -79.671875, -76.4140625, -73.15625, -69.8984375, -66.640625, -63.3828125, -60.125, -56.8671875, -53.609375, -50.3515625, -47.09375, -43.8359375, -40.578125, -37.3203125, -34.0625, -30.8046875, -27.546875, -24.2890625, -21.03125, -17.7734375, -14.515625, -11.2578125, -8.0, -4.7421875, -1.484375, 1.7734375, 5.03125, 8.2890625, 11.546875, 14.8046875, 18.0625, 21.3203125, 24.578125, 27.8359375, 31.09375, 34.3515625, 37.609375, 40.8671875, 44.125, 47.3828125, 50.640625, 53.8984375, 57.15625, 60.4140625, 63.671875, 66.9296875, 70.1875, 73.4453125, 76.703125, 79.9609375, 83.21875, 86.4765625, 89.734375, 92.9921875, 96.25]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 5.0, 9.0, 14.0, 13.0, 22.0, 22.0, 15.0, 27.0, 25.0, 30.0, 30.0, 35.0, 36.0, 45.0, 31.0, 32.0, 38.0, 52.0, 50.0, 45.0, 59.0, 40.0, 33.0, 40.0, 31.0, 28.0, 28.0, 29.0, 18.0, 19.0, 22.0, 13.0, 10.0, 7.0, 5.0, 7.0, 4.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.90625, -56.07763671875, -54.2490234375, -52.42041015625, -50.591796875, -48.76318359375, -46.9345703125, -45.10595703125, -43.27734375, -41.44873046875, -39.6201171875, -37.79150390625, -35.962890625, -34.13427734375, -32.3056640625, -30.47705078125, -28.6484375, -26.81982421875, -24.9912109375, -23.16259765625, -21.333984375, -19.50537109375, -17.6767578125, -15.84814453125, -14.01953125, -12.19091796875, -10.3623046875, -8.53369140625, -6.705078125, -4.87646484375, -3.0478515625, -1.21923828125, 0.609375, 2.43798828125, 4.2666015625, 6.09521484375, 7.923828125, 9.75244140625, 11.5810546875, 13.40966796875, 15.23828125, 17.06689453125, 18.8955078125, 20.72412109375, 22.552734375, 24.38134765625, 26.2099609375, 28.03857421875, 29.8671875, 31.69580078125, 33.5244140625, 35.35302734375, 37.181640625, 39.01025390625, 40.8388671875, 42.66748046875, 44.49609375, 46.32470703125, 48.1533203125, 49.98193359375, 51.810546875, 53.63916015625, 55.4677734375, 57.29638671875, 59.125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 7.0, 11.0, 18.0, 28.0, 27.0, 47.0, 74.0, 103.0, 159.0, 264.0, 497.0, 916.0, 1983.0, 5616.0, 24123.0, 221481.0, 684567.0, 89024.0, 12948.0, 3530.0, 1365.0, 686.0, 376.0, 253.0, 127.0, 93.0, 72.0, 44.0, 30.0, 23.0, 17.0, 8.0, 8.0, 9.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.5625, -31.48828125, -30.4140625, -29.33984375, -28.265625, -27.19140625, -26.1171875, -25.04296875, -23.96875, -22.89453125, -21.8203125, -20.74609375, -19.671875, -18.59765625, -17.5234375, -16.44921875, -15.375, -14.30078125, -13.2265625, -12.15234375, -11.078125, -10.00390625, -8.9296875, -7.85546875, -6.78125, -5.70703125, -4.6328125, -3.55859375, -2.484375, -1.41015625, -0.3359375, 0.73828125, 1.8125, 2.88671875, 3.9609375, 5.03515625, 6.109375, 7.18359375, 8.2578125, 9.33203125, 10.40625, 11.48046875, 12.5546875, 13.62890625, 14.703125, 15.77734375, 16.8515625, 17.92578125, 19.0, 20.07421875, 21.1484375, 22.22265625, 23.296875, 24.37109375, 25.4453125, 26.51953125, 27.59375, 28.66796875, 29.7421875, 30.81640625, 31.890625, 32.96484375, 34.0390625, 35.11328125, 36.1875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 10.0, 7.0, 8.0, 12.0, 7.0, 15.0, 20.0, 31.0, 39.0, 66.0, 70.0, 84.0, 121.0, 104.0, 102.0, 74.0, 59.0, 55.0, 34.0, 22.0, 16.0, 13.0, 8.0, 6.0, 3.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.006134033203125, -0.005959868431091309, -0.005785703659057617, -0.005611538887023926, -0.005437374114990234, -0.005263209342956543, -0.0050890445709228516, -0.00491487979888916, -0.004740715026855469, -0.004566550254821777, -0.004392385482788086, -0.0042182207107543945, -0.004044055938720703, -0.0038698911666870117, -0.0036957263946533203, -0.003521561622619629, -0.0033473968505859375, -0.003173232078552246, -0.0029990673065185547, -0.0028249025344848633, -0.002650737762451172, -0.0024765729904174805, -0.002302408218383789, -0.0021282434463500977, -0.0019540786743164062, -0.0017799139022827148, -0.0016057491302490234, -0.001431584358215332, -0.0012574195861816406, -0.0010832548141479492, -0.0009090900421142578, -0.0007349252700805664, -0.000560760498046875, -0.0003865957260131836, -0.0002124309539794922, -3.826618194580078e-05, 0.00013589859008789062, 0.00031006336212158203, 0.00048422813415527344, 0.0006583929061889648, 0.0008325576782226562, 0.0010067224502563477, 0.001180887222290039, 0.0013550519943237305, 0.0015292167663574219, 0.0017033815383911133, 0.0018775463104248047, 0.002051711082458496, 0.0022258758544921875, 0.002400040626525879, 0.0025742053985595703, 0.0027483701705932617, 0.002922534942626953, 0.0030966997146606445, 0.003270864486694336, 0.0034450292587280273, 0.0036191940307617188, 0.00379335880279541, 0.0039675235748291016, 0.004141688346862793, 0.004315853118896484, 0.004490017890930176, 0.004664182662963867, 0.004838347434997559, 0.00501251220703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 16.0, 18.0, 29.0, 73.0, 104.0, 207.0, 516.0, 1546.0, 7066.0, 109248.0, 879628.0, 43579.0, 4497.0, 1198.0, 379.0, 195.0, 95.0, 61.0, 33.0, 16.0, 15.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -49.1865234375, -47.248046875, -45.3095703125, -43.37109375, -41.4326171875, -39.494140625, -37.5556640625, -35.6171875, -33.6787109375, -31.740234375, -29.8017578125, -27.86328125, -25.9248046875, -23.986328125, -22.0478515625, -20.109375, -18.1708984375, -16.232421875, -14.2939453125, -12.35546875, -10.4169921875, -8.478515625, -6.5400390625, -4.6015625, -2.6630859375, -0.724609375, 1.2138671875, 3.15234375, 5.0908203125, 7.029296875, 8.9677734375, 10.90625, 12.8447265625, 14.783203125, 16.7216796875, 18.66015625, 20.5986328125, 22.537109375, 24.4755859375, 26.4140625, 28.3525390625, 30.291015625, 32.2294921875, 34.16796875, 36.1064453125, 38.044921875, 39.9833984375, 41.921875, 43.8603515625, 45.798828125, 47.7373046875, 49.67578125, 51.6142578125, 53.552734375, 55.4912109375, 57.4296875, 59.3681640625, 61.306640625, 63.2451171875, 65.18359375, 67.1220703125, 69.060546875, 70.9990234375, 72.9375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 15.0, 18.0, 26.0, 55.0, 62.0, 91.0, 107.0, 145.0, 130.0, 80.0, 89.0, 59.0, 38.0, 26.0, 13.0, 12.0, 5.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.65625, -48.439208984375, -47.22216796875, -46.005126953125, -44.7880859375, -43.571044921875, -42.35400390625, -41.136962890625, -39.919921875, -38.702880859375, -37.48583984375, -36.268798828125, -35.0517578125, -33.834716796875, -32.61767578125, -31.400634765625, -30.18359375, -28.966552734375, -27.74951171875, -26.532470703125, -25.3154296875, -24.098388671875, -22.88134765625, -21.664306640625, -20.447265625, -19.230224609375, -18.01318359375, -16.796142578125, -15.5791015625, -14.362060546875, -13.14501953125, -11.927978515625, -10.7109375, -9.493896484375, -8.27685546875, -7.059814453125, -5.8427734375, -4.625732421875, -3.40869140625, -2.191650390625, -0.974609375, 0.242431640625, 1.45947265625, 2.676513671875, 3.8935546875, 5.110595703125, 6.32763671875, 7.544677734375, 8.76171875, 9.978759765625, 11.19580078125, 12.412841796875, 13.6298828125, 14.846923828125, 16.06396484375, 17.281005859375, 18.498046875, 19.715087890625, 20.93212890625, 22.149169921875, 23.3662109375, 24.583251953125, 25.80029296875, 27.017333984375, 28.234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 16.0, 41.0, 71.0, 84.0, 133.0, 151.0, 149.0, 139.0, 93.0, 58.0, 24.0, 18.0, 9.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-848.6618041992188, -831.5957641601562, -814.5296630859375, -797.463623046875, -780.3975830078125, -763.33154296875, -746.2654418945312, -729.1994018554688, -712.13330078125, -695.0672607421875, -678.0011596679688, -660.9351196289062, -643.8690795898438, -626.802978515625, -609.7369384765625, -592.6708984375, -575.6048583984375, -558.538818359375, -541.4727172851562, -524.4066772460938, -507.34063720703125, -490.2745666503906, -473.20849609375, -456.1424560546875, -439.0763854980469, -422.01031494140625, -404.94427490234375, -387.8782043457031, -370.8121337890625, -353.74609375, -336.6800231933594, -319.61395263671875, -302.54791259765625, -285.4818420410156, -268.4158020019531, -251.3497314453125, -234.28367614746094, -217.21762084960938, -200.15155029296875, -183.0854949951172, -166.01942443847656, -148.953369140625, -131.88729858398438, -114.82124328613281, -97.75518798828125, -80.68913269042969, -63.623069763183594, -46.5570068359375, -29.490951538085938, -12.42489242553711, 4.641166687011719, 21.707225799560547, 38.773284912109375, 55.83934020996094, 72.90540313720703, 89.97146606445312, 107.03752136230469, 124.10357666015625, 141.16964721679688, 158.23570251464844, 175.3017578125, 192.36781311035156, 209.43386840820312, 226.49993896484375, 243.5659942626953]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 8.0, 6.0, 3.0, 11.0, 9.0, 18.0, 22.0, 17.0, 29.0, 30.0, 33.0, 54.0, 56.0, 46.0, 54.0, 59.0, 64.0, 71.0, 55.0, 58.0, 50.0, 50.0, 43.0, 26.0, 21.0, 25.0, 15.0, 18.0, 19.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-317.2839050292969, -305.4145202636719, -293.54510498046875, -281.67572021484375, -269.80633544921875, -257.9369201660156, -246.06753540039062, -234.19813537597656, -222.3287353515625, -210.45933532714844, -198.58993530273438, -186.72055053710938, -174.8511505126953, -162.98175048828125, -151.11236572265625, -139.2429656982422, -127.37356567382812, -115.50416564941406, -103.63477325439453, -91.765380859375, -79.89598083496094, -68.02658081054688, -56.157188415527344, -44.28779602050781, -32.41839599609375, -20.548999786376953, -8.679603576660156, 3.1897926330566406, 15.059188842773438, 26.928585052490234, 38.79798126220703, 50.66737365722656, 62.5367431640625, 74.40614318847656, 86.2755355834961, 98.14492797851562, 110.01432800292969, 121.88372802734375, 133.75311279296875, 145.6225128173828, 157.49191284179688, 169.36131286621094, 181.230712890625, 193.10009765625, 204.96949768066406, 216.83889770507812, 228.70828247070312, 240.5776824951172, 252.44708251953125, 264.31646728515625, 276.1858825683594, 288.0552673339844, 299.9246826171875, 311.7940673828125, 323.6634521484375, 335.5328369140625, 347.4022521972656, 359.2716369628906, 371.14105224609375, 383.01043701171875, 394.87982177734375, 406.7492370605469, 418.6186218261719, 430.488037109375, 442.357421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 6.0, 12.0, 17.0, 15.0, 23.0, 34.0, 46.0, 64.0, 82.0, 138.0, 150.0, 282.0, 461.0, 725.0, 1305.0, 2704.0, 6540.0, 22066.0, 3702914.0, 424813.0, 20065.0, 6030.0, 2538.0, 1249.0, 739.0, 424.0, 235.0, 180.0, 109.0, 76.0, 50.0, 47.0, 33.0, 24.0, 16.0, 16.0, 9.0, 10.0, 5.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-66.3125, -64.23828125, -62.1640625, -60.08984375, -58.015625, -55.94140625, -53.8671875, -51.79296875, -49.71875, -47.64453125, -45.5703125, -43.49609375, -41.421875, -39.34765625, -37.2734375, -35.19921875, -33.125, -31.05078125, -28.9765625, -26.90234375, -24.828125, -22.75390625, -20.6796875, -18.60546875, -16.53125, -14.45703125, -12.3828125, -10.30859375, -8.234375, -6.16015625, -4.0859375, -2.01171875, 0.0625, 2.13671875, 4.2109375, 6.28515625, 8.359375, 10.43359375, 12.5078125, 14.58203125, 16.65625, 18.73046875, 20.8046875, 22.87890625, 24.953125, 27.02734375, 29.1015625, 31.17578125, 33.25, 35.32421875, 37.3984375, 39.47265625, 41.546875, 43.62109375, 45.6953125, 47.76953125, 49.84375, 51.91796875, 53.9921875, 56.06640625, 58.140625, 60.21484375, 62.2890625, 64.36328125, 66.4375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 10.0, 9.0, 10.0, 12.0, 13.0, 25.0, 31.0, 32.0, 56.0, 40.0, 66.0, 62.0, 83.0, 52.0, 77.0, 66.0, 63.0, 53.0, 44.0, 44.0, 38.0, 33.0, 21.0, 14.0, 11.0, 11.0, 4.0, 9.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.13916015625, -19.5439453125, -18.94873046875, -18.353515625, -17.75830078125, -17.1630859375, -16.56787109375, -15.97265625, -15.37744140625, -14.7822265625, -14.18701171875, -13.591796875, -12.99658203125, -12.4013671875, -11.80615234375, -11.2109375, -10.61572265625, -10.0205078125, -9.42529296875, -8.830078125, -8.23486328125, -7.6396484375, -7.04443359375, -6.44921875, -5.85400390625, -5.2587890625, -4.66357421875, -4.068359375, -3.47314453125, -2.8779296875, -2.28271484375, -1.6875, -1.09228515625, -0.4970703125, 0.09814453125, 0.693359375, 1.28857421875, 1.8837890625, 2.47900390625, 3.07421875, 3.66943359375, 4.2646484375, 4.85986328125, 5.455078125, 6.05029296875, 6.6455078125, 7.24072265625, 7.8359375, 8.43115234375, 9.0263671875, 9.62158203125, 10.216796875, 10.81201171875, 11.4072265625, 12.00244140625, 12.59765625, 13.19287109375, 13.7880859375, 14.38330078125, 14.978515625, 15.57373046875, 16.1689453125, 16.76416015625, 17.359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 9.0, 16.0, 17.0, 36.0, 28.0, 42.0, 84.0, 118.0, 168.0, 265.0, 396.0, 651.0, 1199.0, 2515.0, 6322.0, 26277.0, 4037331.0, 100132.0, 10851.0, 3691.0, 1736.0, 883.0, 498.0, 327.0, 208.0, 127.0, 112.0, 67.0, 53.0, 33.0, 31.0, 11.0, 8.0, 11.0, 4.0, 6.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-118.5, -115.359375, -112.21875, -109.078125, -105.9375, -102.796875, -99.65625, -96.515625, -93.375, -90.234375, -87.09375, -83.953125, -80.8125, -77.671875, -74.53125, -71.390625, -68.25, -65.109375, -61.96875, -58.828125, -55.6875, -52.546875, -49.40625, -46.265625, -43.125, -39.984375, -36.84375, -33.703125, -30.5625, -27.421875, -24.28125, -21.140625, -18.0, -14.859375, -11.71875, -8.578125, -5.4375, -2.296875, 0.84375, 3.984375, 7.125, 10.265625, 13.40625, 16.546875, 19.6875, 22.828125, 25.96875, 29.109375, 32.25, 35.390625, 38.53125, 41.671875, 44.8125, 47.953125, 51.09375, 54.234375, 57.375, 60.515625, 63.65625, 66.796875, 69.9375, 73.078125, 76.21875, 79.359375, 82.5]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 12.0, 29.0, 59.0, 191.0, 3456.0, 188.0, 55.0, 19.0, 15.0, 8.0, 4.0, 2.0, 2.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-25.75, -25.097412109375, -24.44482421875, -23.792236328125, -23.1396484375, -22.487060546875, -21.83447265625, -21.181884765625, -20.529296875, -19.876708984375, -19.22412109375, -18.571533203125, -17.9189453125, -17.266357421875, -16.61376953125, -15.961181640625, -15.30859375, -14.656005859375, -14.00341796875, -13.350830078125, -12.6982421875, -12.045654296875, -11.39306640625, -10.740478515625, -10.087890625, -9.435302734375, -8.78271484375, -8.130126953125, -7.4775390625, -6.824951171875, -6.17236328125, -5.519775390625, -4.8671875, -4.214599609375, -3.56201171875, -2.909423828125, -2.2568359375, -1.604248046875, -0.95166015625, -0.299072265625, 0.353515625, 1.006103515625, 1.65869140625, 2.311279296875, 2.9638671875, 3.616455078125, 4.26904296875, 4.921630859375, 5.57421875, 6.226806640625, 6.87939453125, 7.531982421875, 8.1845703125, 8.837158203125, 9.48974609375, 10.142333984375, 10.794921875, 11.447509765625, 12.10009765625, 12.752685546875, 13.4052734375, 14.057861328125, 14.71044921875, 15.363037109375, 16.015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 8.0, 9.0, 11.0, 19.0, 25.0, 38.0, 74.0, 94.0, 147.0, 159.0, 115.0, 99.0, 71.0, 39.0, 29.0, 17.0, 14.0, 10.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.260986328125, -81.47915649414062, -78.69731903076172, -75.91548919677734, -73.13365173339844, -70.35182189941406, -67.56998443603516, -64.78815460205078, -62.006317138671875, -59.224483489990234, -56.442649841308594, -53.66081619262695, -50.87898254394531, -48.09714889526367, -45.31531524658203, -42.533485412597656, -39.751651763916016, -36.969818115234375, -34.187984466552734, -31.406150817871094, -28.624317169189453, -25.842483520507812, -23.060651779174805, -20.278818130493164, -17.496984481811523, -14.715150833129883, -11.933317184448242, -9.151484489440918, -6.369650840759277, -3.5878171920776367, -0.8059844970703125, 1.9758491516113281, 4.757682800292969, 7.539516448974609, 10.32135009765625, 13.103182792663574, 15.885016441345215, 18.666851043701172, 21.44868278503418, 24.23051643371582, 27.01235008239746, 29.7941837310791, 32.57601547241211, 35.35784912109375, 38.13968276977539, 40.92151641845703, 43.70335006713867, 46.48518371582031, 49.26701736450195, 52.048851013183594, 54.830684661865234, 57.612518310546875, 60.394351959228516, 63.176185607910156, 65.95801544189453, 68.73985290527344, 71.52168273925781, 74.30351257324219, 77.0853500366211, 79.86717987060547, 82.64901733398438, 85.43084716796875, 88.21268463134766, 90.99451446533203, 93.77635192871094]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 3.0, 5.0, 6.0, 11.0, 9.0, 13.0, 10.0, 14.0, 20.0, 22.0, 24.0, 31.0, 26.0, 27.0, 39.0, 31.0, 40.0, 43.0, 44.0, 38.0, 46.0, 46.0, 31.0, 36.0, 39.0, 43.0, 33.0, 28.0, 34.0, 32.0, 30.0, 18.0, 17.0, 18.0, 20.0, 12.0, 15.0, 5.0, 7.0, 5.0, 2.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.69208526611328, -32.61668014526367, -31.541275024414062, -30.46586799621582, -29.39046287536621, -28.3150577545166, -27.23965072631836, -26.16424560546875, -25.08884048461914, -24.01343536376953, -22.938030242919922, -21.86262321472168, -20.78721809387207, -19.71181297302246, -18.63640594482422, -17.56100082397461, -16.485595703125, -15.41019058227539, -14.334784507751465, -13.259378433227539, -12.18397331237793, -11.10856819152832, -10.033162117004395, -8.957756042480469, -7.882350921630859, -6.806945323944092, -5.731539726257324, -4.656134128570557, -3.580728530883789, -2.5053229331970215, -1.429917335510254, -0.35451173782348633, 0.7208976745605469, 1.7963032722473145, 2.871708869934082, 3.9471144676208496, 5.022520065307617, 6.097925662994385, 7.173331260681152, 8.248737335205078, 9.324142456054688, 10.399547576904297, 11.474953651428223, 12.550359725952148, 13.625764846801758, 14.701169967651367, 15.776576042175293, 16.85198211669922, 17.927387237548828, 19.002792358398438, 20.078197479248047, 21.15360450744629, 22.2290096282959, 23.304414749145508, 24.37982177734375, 25.45522689819336, 26.53063201904297, 27.606037139892578, 28.681442260742188, 29.75684928894043, 30.83225440979004, 31.90765953063965, 32.98306655883789, 34.0584716796875, 35.13387680053711]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 4.0, 8.0, 11.0, 13.0, 30.0, 36.0, 60.0, 81.0, 101.0, 157.0, 240.0, 323.0, 580.0, 1008.0, 1800.0, 3399.0, 6755.0, 13697.0, 28768.0, 61207.0, 136281.0, 292575.0, 271014.0, 122970.0, 55018.0, 26163.0, 12604.0, 6339.0, 3168.0, 1720.0, 942.0, 518.0, 333.0, 184.0, 138.0, 87.0, 67.0, 36.0, 34.0, 15.0, 15.0, 17.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-27.671875, -26.90185546875, -26.1318359375, -25.36181640625, -24.591796875, -23.82177734375, -23.0517578125, -22.28173828125, -21.51171875, -20.74169921875, -19.9716796875, -19.20166015625, -18.431640625, -17.66162109375, -16.8916015625, -16.12158203125, -15.3515625, -14.58154296875, -13.8115234375, -13.04150390625, -12.271484375, -11.50146484375, -10.7314453125, -9.96142578125, -9.19140625, -8.42138671875, -7.6513671875, -6.88134765625, -6.111328125, -5.34130859375, -4.5712890625, -3.80126953125, -3.03125, -2.26123046875, -1.4912109375, -0.72119140625, 0.048828125, 0.81884765625, 1.5888671875, 2.35888671875, 3.12890625, 3.89892578125, 4.6689453125, 5.43896484375, 6.208984375, 6.97900390625, 7.7490234375, 8.51904296875, 9.2890625, 10.05908203125, 10.8291015625, 11.59912109375, 12.369140625, 13.13916015625, 13.9091796875, 14.67919921875, 15.44921875, 16.21923828125, 16.9892578125, 17.75927734375, 18.529296875, 19.29931640625, 20.0693359375, 20.83935546875, 21.609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 6.0, 1.0, 8.0, 14.0, 6.0, 13.0, 23.0, 22.0, 37.0, 36.0, 45.0, 42.0, 46.0, 47.0, 58.0, 66.0, 72.0, 60.0, 62.0, 61.0, 42.0, 39.0, 33.0, 36.0, 26.0, 22.0, 13.0, 11.0, 7.0, 11.0, 9.0, 8.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.6875, -19.09423828125, -18.5009765625, -17.90771484375, -17.314453125, -16.72119140625, -16.1279296875, -15.53466796875, -14.94140625, -14.34814453125, -13.7548828125, -13.16162109375, -12.568359375, -11.97509765625, -11.3818359375, -10.78857421875, -10.1953125, -9.60205078125, -9.0087890625, -8.41552734375, -7.822265625, -7.22900390625, -6.6357421875, -6.04248046875, -5.44921875, -4.85595703125, -4.2626953125, -3.66943359375, -3.076171875, -2.48291015625, -1.8896484375, -1.29638671875, -0.703125, -0.10986328125, 0.4833984375, 1.07666015625, 1.669921875, 2.26318359375, 2.8564453125, 3.44970703125, 4.04296875, 4.63623046875, 5.2294921875, 5.82275390625, 6.416015625, 7.00927734375, 7.6025390625, 8.19580078125, 8.7890625, 9.38232421875, 9.9755859375, 10.56884765625, 11.162109375, 11.75537109375, 12.3486328125, 12.94189453125, 13.53515625, 14.12841796875, 14.7216796875, 15.31494140625, 15.908203125, 16.50146484375, 17.0947265625, 17.68798828125, 18.28125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 11.0, 10.0, 15.0, 20.0, 34.0, 48.0, 69.0, 111.0, 172.0, 294.0, 590.0, 1359.0, 4128.0, 34629.0, 792113.0, 199465.0, 11292.0, 2273.0, 831.0, 413.0, 208.0, 129.0, 93.0, 63.0, 36.0, 33.0, 27.0, 19.0, 12.0, 7.0, 6.0, 4.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.125, -79.4560546875, -76.787109375, -74.1181640625, -71.44921875, -68.7802734375, -66.111328125, -63.4423828125, -60.7734375, -58.1044921875, -55.435546875, -52.7666015625, -50.09765625, -47.4287109375, -44.759765625, -42.0908203125, -39.421875, -36.7529296875, -34.083984375, -31.4150390625, -28.74609375, -26.0771484375, -23.408203125, -20.7392578125, -18.0703125, -15.4013671875, -12.732421875, -10.0634765625, -7.39453125, -4.7255859375, -2.056640625, 0.6123046875, 3.28125, 5.9501953125, 8.619140625, 11.2880859375, 13.95703125, 16.6259765625, 19.294921875, 21.9638671875, 24.6328125, 27.3017578125, 29.970703125, 32.6396484375, 35.30859375, 37.9775390625, 40.646484375, 43.3154296875, 45.984375, 48.6533203125, 51.322265625, 53.9912109375, 56.66015625, 59.3291015625, 61.998046875, 64.6669921875, 67.3359375, 70.0048828125, 72.673828125, 75.3427734375, 78.01171875, 80.6806640625, 83.349609375, 86.0185546875, 88.6875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 0.0, 7.0, 11.0, 11.0, 12.0, 18.0, 18.0, 16.0, 17.0, 24.0, 17.0, 22.0, 34.0, 34.0, 46.0, 34.0, 44.0, 30.0, 49.0, 28.0, 35.0, 47.0, 41.0, 44.0, 42.0, 35.0, 27.0, 32.0, 38.0, 27.0, 17.0, 28.0, 16.0, 11.0, 17.0, 9.0, 16.0, 5.0, 8.0, 8.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.96875, -58.10595703125, -56.2431640625, -54.38037109375, -52.517578125, -50.65478515625, -48.7919921875, -46.92919921875, -45.06640625, -43.20361328125, -41.3408203125, -39.47802734375, -37.615234375, -35.75244140625, -33.8896484375, -32.02685546875, -30.1640625, -28.30126953125, -26.4384765625, -24.57568359375, -22.712890625, -20.85009765625, -18.9873046875, -17.12451171875, -15.26171875, -13.39892578125, -11.5361328125, -9.67333984375, -7.810546875, -5.94775390625, -4.0849609375, -2.22216796875, -0.359375, 1.50341796875, 3.3662109375, 5.22900390625, 7.091796875, 8.95458984375, 10.8173828125, 12.68017578125, 14.54296875, 16.40576171875, 18.2685546875, 20.13134765625, 21.994140625, 23.85693359375, 25.7197265625, 27.58251953125, 29.4453125, 31.30810546875, 33.1708984375, 35.03369140625, 36.896484375, 38.75927734375, 40.6220703125, 42.48486328125, 44.34765625, 46.21044921875, 48.0732421875, 49.93603515625, 51.798828125, 53.66162109375, 55.5244140625, 57.38720703125, 59.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0, 3.0, 8.0, 15.0, 11.0, 33.0, 40.0, 97.0, 125.0, 251.0, 500.0, 1311.0, 3811.0, 16638.0, 150796.0, 776551.0, 82179.0, 11213.0, 2951.0, 1027.0, 453.0, 217.0, 126.0, 65.0, 40.0, 26.0, 18.0, 15.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.625, -34.52490234375, -33.4248046875, -32.32470703125, -31.224609375, -30.12451171875, -29.0244140625, -27.92431640625, -26.82421875, -25.72412109375, -24.6240234375, -23.52392578125, -22.423828125, -21.32373046875, -20.2236328125, -19.12353515625, -18.0234375, -16.92333984375, -15.8232421875, -14.72314453125, -13.623046875, -12.52294921875, -11.4228515625, -10.32275390625, -9.22265625, -8.12255859375, -7.0224609375, -5.92236328125, -4.822265625, -3.72216796875, -2.6220703125, -1.52197265625, -0.421875, 0.67822265625, 1.7783203125, 2.87841796875, 3.978515625, 5.07861328125, 6.1787109375, 7.27880859375, 8.37890625, 9.47900390625, 10.5791015625, 11.67919921875, 12.779296875, 13.87939453125, 14.9794921875, 16.07958984375, 17.1796875, 18.27978515625, 19.3798828125, 20.47998046875, 21.580078125, 22.68017578125, 23.7802734375, 24.88037109375, 25.98046875, 27.08056640625, 28.1806640625, 29.28076171875, 30.380859375, 31.48095703125, 32.5810546875, 33.68115234375, 34.78125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 9.0, 5.0, 14.0, 13.0, 22.0, 23.0, 24.0, 47.0, 45.0, 70.0, 94.0, 113.0, 126.0, 90.0, 68.0, 41.0, 38.0, 34.0, 18.0, 19.0, 19.0, 18.0, 7.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00572967529296875, -0.005567014217376709, -0.005404353141784668, -0.005241692066192627, -0.005079030990600586, -0.004916369915008545, -0.004753708839416504, -0.004591047763824463, -0.004428386688232422, -0.004265725612640381, -0.00410306453704834, -0.003940403461456299, -0.003777742385864258, -0.003615081310272217, -0.0034524202346801758, -0.0032897591590881348, -0.0031270980834960938, -0.0029644370079040527, -0.0028017759323120117, -0.0026391148567199707, -0.0024764537811279297, -0.0023137927055358887, -0.0021511316299438477, -0.0019884705543518066, -0.0018258094787597656, -0.0016631484031677246, -0.0015004873275756836, -0.0013378262519836426, -0.0011751651763916016, -0.0010125041007995605, -0.0008498430252075195, -0.0006871819496154785, -0.0005245208740234375, -0.0003618597984313965, -0.00019919872283935547, -3.653764724731445e-05, 0.00012612342834472656, 0.0002887845039367676, 0.0004514455795288086, 0.0006141066551208496, 0.0007767677307128906, 0.0009394288063049316, 0.0011020898818969727, 0.0012647509574890137, 0.0014274120330810547, 0.0015900731086730957, 0.0017527341842651367, 0.0019153952598571777, 0.0020780563354492188, 0.0022407174110412598, 0.0024033784866333008, 0.002566039562225342, 0.002728700637817383, 0.002891361713409424, 0.003054022789001465, 0.003216683864593506, 0.003379344940185547, 0.003542006015777588, 0.003704667091369629, 0.00386732816696167, 0.004029989242553711, 0.004192650318145752, 0.004355311393737793, 0.004517972469329834, 0.004680633544921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 10.0, 16.0, 20.0, 29.0, 89.0, 139.0, 313.0, 905.0, 3368.0, 27091.0, 730428.0, 270472.0, 12498.0, 2044.0, 612.0, 266.0, 119.0, 55.0, 30.0, 25.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.9375, -54.234375, -52.53125, -50.828125, -49.125, -47.421875, -45.71875, -44.015625, -42.3125, -40.609375, -38.90625, -37.203125, -35.5, -33.796875, -32.09375, -30.390625, -28.6875, -26.984375, -25.28125, -23.578125, -21.875, -20.171875, -18.46875, -16.765625, -15.0625, -13.359375, -11.65625, -9.953125, -8.25, -6.546875, -4.84375, -3.140625, -1.4375, 0.265625, 1.96875, 3.671875, 5.375, 7.078125, 8.78125, 10.484375, 12.1875, 13.890625, 15.59375, 17.296875, 19.0, 20.703125, 22.40625, 24.109375, 25.8125, 27.515625, 29.21875, 30.921875, 32.625, 34.328125, 36.03125, 37.734375, 39.4375, 41.140625, 42.84375, 44.546875, 46.25, 47.953125, 49.65625, 51.359375, 53.0625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 1.0, 9.0, 6.0, 18.0, 22.0, 28.0, 34.0, 62.0, 80.0, 93.0, 104.0, 113.0, 91.0, 76.0, 70.0, 63.0, 31.0, 28.0, 15.0, 20.0, 10.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6875, -32.7646484375, -31.841796875, -30.9189453125, -29.99609375, -29.0732421875, -28.150390625, -27.2275390625, -26.3046875, -25.3818359375, -24.458984375, -23.5361328125, -22.61328125, -21.6904296875, -20.767578125, -19.8447265625, -18.921875, -17.9990234375, -17.076171875, -16.1533203125, -15.23046875, -14.3076171875, -13.384765625, -12.4619140625, -11.5390625, -10.6162109375, -9.693359375, -8.7705078125, -7.84765625, -6.9248046875, -6.001953125, -5.0791015625, -4.15625, -3.2333984375, -2.310546875, -1.3876953125, -0.46484375, 0.4580078125, 1.380859375, 2.3037109375, 3.2265625, 4.1494140625, 5.072265625, 5.9951171875, 6.91796875, 7.8408203125, 8.763671875, 9.6865234375, 10.609375, 11.5322265625, 12.455078125, 13.3779296875, 14.30078125, 15.2236328125, 16.146484375, 17.0693359375, 17.9921875, 18.9150390625, 19.837890625, 20.7607421875, 21.68359375, 22.6064453125, 23.529296875, 24.4521484375, 25.375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 10.0, 23.0, 35.0, 55.0, 89.0, 122.0, 144.0, 145.0, 121.0, 91.0, 62.0, 34.0, 20.0, 11.0, 11.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.0072326660156, -446.1057434082031, -432.2042541503906, -418.302734375, -404.4012451171875, -390.499755859375, -376.5982666015625, -362.69677734375, -348.7952880859375, -334.893798828125, -320.9923095703125, -307.0908203125, -293.1893005371094, -279.2878112792969, -265.3863220214844, -251.48483276367188, -237.58331298828125, -223.68182373046875, -209.7803192138672, -195.8788299560547, -181.97732543945312, -168.07583618164062, -154.17434692382812, -140.27285766601562, -126.37135314941406, -112.46985626220703, -98.568359375, -84.6668701171875, -70.76537322998047, -56.86387634277344, -42.96238708496094, -29.060890197753906, -15.15936279296875, -1.2578678131103516, 12.643627166748047, 26.545120239257812, 40.446617126464844, 54.348114013671875, 68.24960327148438, 82.1511001586914, 96.05259704589844, 109.95409393310547, 123.8555908203125, 137.757080078125, 151.6585693359375, 165.56007385253906, 179.46156311035156, 193.36306762695312, 207.26455688476562, 221.16604614257812, 235.0675506591797, 248.9690399169922, 262.87054443359375, 276.77203369140625, 290.67352294921875, 304.57501220703125, 318.47650146484375, 332.37799072265625, 346.27947998046875, 360.18096923828125, 374.0824890136719, 387.9839782714844, 401.8854675292969, 415.7869567871094, 429.6884765625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 3.0, 6.0, 3.0, 11.0, 8.0, 9.0, 17.0, 19.0, 17.0, 16.0, 24.0, 28.0, 37.0, 37.0, 27.0, 51.0, 38.0, 56.0, 48.0, 55.0, 57.0, 52.0, 42.0, 43.0, 34.0, 35.0, 25.0, 31.0, 28.0, 22.0, 20.0, 22.0, 14.0, 13.0, 11.0, 7.0, 6.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-335.2519836425781, -326.1717224121094, -317.0914611816406, -308.01116943359375, -298.930908203125, -289.85064697265625, -280.7703857421875, -271.69012451171875, -262.6098327636719, -253.52957153320312, -244.4492950439453, -235.36903381347656, -226.28875732421875, -217.20849609375, -208.12823486328125, -199.04795837402344, -189.9676971435547, -180.88743591308594, -171.80715942382812, -162.72689819335938, -153.64662170410156, -144.5663604736328, -135.486083984375, -126.40582275390625, -117.32555389404297, -108.24528503417969, -99.1650161743164, -90.08474731445312, -81.00448608398438, -71.92420959472656, -62.84394836425781, -53.76367950439453, -44.68341064453125, -35.60314178466797, -26.52287483215332, -17.442607879638672, -8.36233901977539, 0.7179298400878906, 9.798194885253906, 18.878463745117188, 27.95873260498047, 37.03900146484375, 46.11927032470703, 55.19953536987305, 64.27980041503906, 73.36007690429688, 82.44033813476562, 91.5206069946289, 100.60087585449219, 109.68114471435547, 118.76141357421875, 127.8416748046875, 136.9219512939453, 146.00221252441406, 155.08248901367188, 164.16275024414062, 173.24301147460938, 182.32327270507812, 191.40354919433594, 200.4838104248047, 209.5640869140625, 218.64434814453125, 227.724609375, 236.8048858642578, 245.88516235351562]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 2.0, 7.0, 7.0, 17.0, 21.0, 25.0, 29.0, 54.0, 50.0, 102.0, 118.0, 163.0, 241.0, 325.0, 451.0, 741.0, 1167.0, 1862.0, 3254.0, 6596.0, 17793.0, 81467.0, 3854889.0, 179252.0, 26709.0, 8896.0, 4009.0, 2137.0, 1262.0, 834.0, 551.0, 375.0, 245.0, 164.0, 133.0, 79.0, 61.0, 50.0, 36.0, 36.0, 23.0, 9.0, 12.0, 11.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.75, -46.2880859375, -44.826171875, -43.3642578125, -41.90234375, -40.4404296875, -38.978515625, -37.5166015625, -36.0546875, -34.5927734375, -33.130859375, -31.6689453125, -30.20703125, -28.7451171875, -27.283203125, -25.8212890625, -24.359375, -22.8974609375, -21.435546875, -19.9736328125, -18.51171875, -17.0498046875, -15.587890625, -14.1259765625, -12.6640625, -11.2021484375, -9.740234375, -8.2783203125, -6.81640625, -5.3544921875, -3.892578125, -2.4306640625, -0.96875, 0.4931640625, 1.955078125, 3.4169921875, 4.87890625, 6.3408203125, 7.802734375, 9.2646484375, 10.7265625, 12.1884765625, 13.650390625, 15.1123046875, 16.57421875, 18.0361328125, 19.498046875, 20.9599609375, 22.421875, 23.8837890625, 25.345703125, 26.8076171875, 28.26953125, 29.7314453125, 31.193359375, 32.6552734375, 34.1171875, 35.5791015625, 37.041015625, 38.5029296875, 39.96484375, 41.4267578125, 42.888671875, 44.3505859375, 45.8125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 10.0, 8.0, 7.0, 20.0, 21.0, 33.0, 33.0, 52.0, 51.0, 80.0, 68.0, 86.0, 81.0, 85.0, 88.0, 67.0, 49.0, 43.0, 25.0, 26.0, 23.0, 14.0, 10.0, 9.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-33.40625, -32.6671142578125, -31.927978515625, -31.1888427734375, -30.44970703125, -29.7105712890625, -28.971435546875, -28.2322998046875, -27.4931640625, -26.7540283203125, -26.014892578125, -25.2757568359375, -24.53662109375, -23.7974853515625, -23.058349609375, -22.3192138671875, -21.580078125, -20.8409423828125, -20.101806640625, -19.3626708984375, -18.62353515625, -17.8843994140625, -17.145263671875, -16.4061279296875, -15.6669921875, -14.9278564453125, -14.188720703125, -13.4495849609375, -12.71044921875, -11.9713134765625, -11.232177734375, -10.4930419921875, -9.75390625, -9.0147705078125, -8.275634765625, -7.5364990234375, -6.79736328125, -6.0582275390625, -5.319091796875, -4.5799560546875, -3.8408203125, -3.1016845703125, -2.362548828125, -1.6234130859375, -0.88427734375, -0.1451416015625, 0.593994140625, 1.3331298828125, 2.072265625, 2.8114013671875, 3.550537109375, 4.2896728515625, 5.02880859375, 5.7679443359375, 6.507080078125, 7.2462158203125, 7.9853515625, 8.7244873046875, 9.463623046875, 10.2027587890625, 10.94189453125, 11.6810302734375, 12.420166015625, 13.1593017578125, 13.8984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 5.0, 18.0, 31.0, 33.0, 50.0, 85.0, 128.0, 229.0, 372.0, 687.0, 1297.0, 2683.0, 6398.0, 18460.0, 100581.0, 3928186.0, 104316.0, 18772.0, 6419.0, 2739.0, 1265.0, 616.0, 352.0, 222.0, 107.0, 91.0, 40.0, 33.0, 24.0, 17.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.1875, -59.041015625, -56.89453125, -54.748046875, -52.6015625, -50.455078125, -48.30859375, -46.162109375, -44.015625, -41.869140625, -39.72265625, -37.576171875, -35.4296875, -33.283203125, -31.13671875, -28.990234375, -26.84375, -24.697265625, -22.55078125, -20.404296875, -18.2578125, -16.111328125, -13.96484375, -11.818359375, -9.671875, -7.525390625, -5.37890625, -3.232421875, -1.0859375, 1.060546875, 3.20703125, 5.353515625, 7.5, 9.646484375, 11.79296875, 13.939453125, 16.0859375, 18.232421875, 20.37890625, 22.525390625, 24.671875, 26.818359375, 28.96484375, 31.111328125, 33.2578125, 35.404296875, 37.55078125, 39.697265625, 41.84375, 43.990234375, 46.13671875, 48.283203125, 50.4296875, 52.576171875, 54.72265625, 56.869140625, 59.015625, 61.162109375, 63.30859375, 65.455078125, 67.6015625, 69.748046875, 71.89453125, 74.041015625, 76.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 8.0, 11.0, 16.0, 22.0, 48.0, 62.0, 182.0, 1970.0, 1340.0, 163.0, 92.0, 38.0, 28.0, 19.0, 13.0, 10.0, 7.0, 2.0, 7.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.337890625, -22.50390625, -21.669921875, -20.8359375, -20.001953125, -19.16796875, -18.333984375, -17.5, -16.666015625, -15.83203125, -14.998046875, -14.1640625, -13.330078125, -12.49609375, -11.662109375, -10.828125, -9.994140625, -9.16015625, -8.326171875, -7.4921875, -6.658203125, -5.82421875, -4.990234375, -4.15625, -3.322265625, -2.48828125, -1.654296875, -0.8203125, 0.013671875, 0.84765625, 1.681640625, 2.515625, 3.349609375, 4.18359375, 5.017578125, 5.8515625, 6.685546875, 7.51953125, 8.353515625, 9.1875, 10.021484375, 10.85546875, 11.689453125, 12.5234375, 13.357421875, 14.19140625, 15.025390625, 15.859375, 16.693359375, 17.52734375, 18.361328125, 19.1953125, 20.029296875, 20.86328125, 21.697265625, 22.53125, 23.365234375, 24.19921875, 25.033203125, 25.8671875, 26.701171875, 27.53515625, 28.369140625, 29.203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 14.0, 16.0, 50.0, 89.0, 158.0, 228.0, 195.0, 116.0, 64.0, 32.0, 23.0, 5.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-266.13922119140625, -259.09765625, -252.0561065673828, -245.01454162597656, -237.9729766845703, -230.93142700195312, -223.88986206054688, -216.84829711914062, -209.80673217773438, -202.76516723632812, -195.72361755371094, -188.6820526123047, -181.64048767089844, -174.59893798828125, -167.557373046875, -160.51580810546875, -153.4742431640625, -146.43267822265625, -139.39112854003906, -132.3495635986328, -125.30799865722656, -118.26644134521484, -111.22488403320312, -104.18331909179688, -97.14176940917969, -90.10021209716797, -83.05864715576172, -76.01708984375, -68.97552490234375, -61.93396759033203, -54.89240646362305, -47.85084533691406, -40.80928039550781, -33.76771926879883, -26.726158142089844, -19.684598922729492, -12.643037796020508, -5.601478576660156, 1.4400825500488281, 8.481643676757812, 15.523204803466797, 22.56476593017578, 29.606327056884766, 36.64788818359375, 43.68944549560547, 50.73100662231445, 57.77256774902344, 64.81413269042969, 71.8556900024414, 78.89724731445312, 85.93881225585938, 92.9803695678711, 100.02193450927734, 107.06349182128906, 114.10505676269531, 121.14661407470703, 128.18817138671875, 135.229736328125, 142.2712860107422, 149.31285095214844, 156.3544158935547, 163.39596557617188, 170.43753051757812, 177.47909545898438, 184.52066040039062]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 13.0, 8.0, 11.0, 24.0, 16.0, 21.0, 33.0, 40.0, 47.0, 36.0, 49.0, 50.0, 52.0, 53.0, 41.0, 54.0, 57.0, 46.0, 54.0, 49.0, 42.0, 27.0, 37.0, 31.0, 25.0, 18.0, 12.0, 14.0, 19.0, 8.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.72419738769531, -88.1270523071289, -85.5299072265625, -82.9327621459961, -80.33561706542969, -77.73847198486328, -75.14132690429688, -72.54417419433594, -69.94703674316406, -67.34989166259766, -64.75274658203125, -62.155601501464844, -59.55845642089844, -56.96131134033203, -54.36416244506836, -51.76701736450195, -49.16986846923828, -46.572723388671875, -43.97557830810547, -41.37843322753906, -38.781288146972656, -36.18414306640625, -33.58699417114258, -30.989849090576172, -28.392704010009766, -25.79555892944336, -23.198413848876953, -20.601266860961914, -18.004121780395508, -15.406976699829102, -12.809830665588379, -10.212684631347656, -7.61553955078125, -5.0183939933776855, -2.421248435974121, 0.17589712142944336, 2.773042678833008, 5.370187759399414, 7.967333793640137, 10.56447982788086, 13.161624908447266, 15.758769989013672, 18.355915069580078, 20.953062057495117, 23.550207138061523, 26.14735221862793, 28.74449920654297, 31.341644287109375, 33.93878936767578, 36.53593444824219, 39.133079528808594, 41.730224609375, 44.327369689941406, 46.92451477050781, 49.521663665771484, 52.11880874633789, 54.7159538269043, 57.3130989074707, 59.91024398803711, 62.507389068603516, 65.10453796386719, 67.7016830444336, 70.298828125, 72.8959732055664, 75.49311828613281]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 21.0, 27.0, 31.0, 68.0, 124.0, 232.0, 463.0, 998.0, 2292.0, 6239.0, 17531.0, 55045.0, 187918.0, 512813.0, 183346.0, 53758.0, 17265.0, 5963.0, 2360.0, 992.0, 512.0, 233.0, 139.0, 71.0, 41.0, 20.0, 21.0, 6.0, 4.0, 7.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.5, -55.96630859375, -54.4326171875, -52.89892578125, -51.365234375, -49.83154296875, -48.2978515625, -46.76416015625, -45.23046875, -43.69677734375, -42.1630859375, -40.62939453125, -39.095703125, -37.56201171875, -36.0283203125, -34.49462890625, -32.9609375, -31.42724609375, -29.8935546875, -28.35986328125, -26.826171875, -25.29248046875, -23.7587890625, -22.22509765625, -20.69140625, -19.15771484375, -17.6240234375, -16.09033203125, -14.556640625, -13.02294921875, -11.4892578125, -9.95556640625, -8.421875, -6.88818359375, -5.3544921875, -3.82080078125, -2.287109375, -0.75341796875, 0.7802734375, 2.31396484375, 3.84765625, 5.38134765625, 6.9150390625, 8.44873046875, 9.982421875, 11.51611328125, 13.0498046875, 14.58349609375, 16.1171875, 17.65087890625, 19.1845703125, 20.71826171875, 22.251953125, 23.78564453125, 25.3193359375, 26.85302734375, 28.38671875, 29.92041015625, 31.4541015625, 32.98779296875, 34.521484375, 36.05517578125, 37.5888671875, 39.12255859375, 40.65625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 23.0, 21.0, 27.0, 22.0, 50.0, 40.0, 45.0, 64.0, 64.0, 76.0, 67.0, 65.0, 79.0, 68.0, 64.0, 37.0, 37.0, 40.0, 20.0, 22.0, 16.0, 9.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.34375, -26.6328125, -25.921875, -25.2109375, -24.5, -23.7890625, -23.078125, -22.3671875, -21.65625, -20.9453125, -20.234375, -19.5234375, -18.8125, -18.1015625, -17.390625, -16.6796875, -15.96875, -15.2578125, -14.546875, -13.8359375, -13.125, -12.4140625, -11.703125, -10.9921875, -10.28125, -9.5703125, -8.859375, -8.1484375, -7.4375, -6.7265625, -6.015625, -5.3046875, -4.59375, -3.8828125, -3.171875, -2.4609375, -1.75, -1.0390625, -0.328125, 0.3828125, 1.09375, 1.8046875, 2.515625, 3.2265625, 3.9375, 4.6484375, 5.359375, 6.0703125, 6.78125, 7.4921875, 8.203125, 8.9140625, 9.625, 10.3359375, 11.046875, 11.7578125, 12.46875, 13.1796875, 13.890625, 14.6015625, 15.3125, 16.0234375, 16.734375, 17.4453125, 18.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 4.0, 17.0, 10.0, 17.0, 19.0, 29.0, 49.0, 59.0, 113.0, 188.0, 342.0, 715.0, 1951.0, 9993.0, 204758.0, 796625.0, 27897.0, 3461.0, 1150.0, 459.0, 268.0, 148.0, 101.0, 55.0, 41.0, 21.0, 14.0, 13.0, 11.0, 6.0, 10.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-115.0625, -111.59765625, -108.1328125, -104.66796875, -101.203125, -97.73828125, -94.2734375, -90.80859375, -87.34375, -83.87890625, -80.4140625, -76.94921875, -73.484375, -70.01953125, -66.5546875, -63.08984375, -59.625, -56.16015625, -52.6953125, -49.23046875, -45.765625, -42.30078125, -38.8359375, -35.37109375, -31.90625, -28.44140625, -24.9765625, -21.51171875, -18.046875, -14.58203125, -11.1171875, -7.65234375, -4.1875, -0.72265625, 2.7421875, 6.20703125, 9.671875, 13.13671875, 16.6015625, 20.06640625, 23.53125, 26.99609375, 30.4609375, 33.92578125, 37.390625, 40.85546875, 44.3203125, 47.78515625, 51.25, 54.71484375, 58.1796875, 61.64453125, 65.109375, 68.57421875, 72.0390625, 75.50390625, 78.96875, 82.43359375, 85.8984375, 89.36328125, 92.828125, 96.29296875, 99.7578125, 103.22265625, 106.6875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 9.0, 12.0, 14.0, 16.0, 24.0, 36.0, 39.0, 29.0, 37.0, 42.0, 37.0, 55.0, 44.0, 68.0, 75.0, 61.0, 53.0, 52.0, 38.0, 41.0, 36.0, 40.0, 17.0, 15.0, 26.0, 12.0, 9.0, 11.0, 5.0, 8.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0, -72.552734375, -70.10546875, -67.658203125, -65.2109375, -62.763671875, -60.31640625, -57.869140625, -55.421875, -52.974609375, -50.52734375, -48.080078125, -45.6328125, -43.185546875, -40.73828125, -38.291015625, -35.84375, -33.396484375, -30.94921875, -28.501953125, -26.0546875, -23.607421875, -21.16015625, -18.712890625, -16.265625, -13.818359375, -11.37109375, -8.923828125, -6.4765625, -4.029296875, -1.58203125, 0.865234375, 3.3125, 5.759765625, 8.20703125, 10.654296875, 13.1015625, 15.548828125, 17.99609375, 20.443359375, 22.890625, 25.337890625, 27.78515625, 30.232421875, 32.6796875, 35.126953125, 37.57421875, 40.021484375, 42.46875, 44.916015625, 47.36328125, 49.810546875, 52.2578125, 54.705078125, 57.15234375, 59.599609375, 62.046875, 64.494140625, 66.94140625, 69.388671875, 71.8359375, 74.283203125, 76.73046875, 79.177734375, 81.625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 10.0, 10.0, 16.0, 21.0, 22.0, 41.0, 49.0, 51.0, 101.0, 138.0, 189.0, 330.0, 466.0, 776.0, 1335.0, 2568.0, 5555.0, 13424.0, 39175.0, 144033.0, 545938.0, 209936.0, 53042.0, 17287.0, 6768.0, 3098.0, 1625.0, 903.0, 553.0, 350.0, 237.0, 144.0, 96.0, 71.0, 51.0, 39.0, 26.0, 22.0, 7.0, 5.0, 5.0, 9.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-16.40625, -15.9183349609375, -15.430419921875, -14.9425048828125, -14.45458984375, -13.9666748046875, -13.478759765625, -12.9908447265625, -12.5029296875, -12.0150146484375, -11.527099609375, -11.0391845703125, -10.55126953125, -10.0633544921875, -9.575439453125, -9.0875244140625, -8.599609375, -8.1116943359375, -7.623779296875, -7.1358642578125, -6.64794921875, -6.1600341796875, -5.672119140625, -5.1842041015625, -4.6962890625, -4.2083740234375, -3.720458984375, -3.2325439453125, -2.74462890625, -2.2567138671875, -1.768798828125, -1.2808837890625, -0.79296875, -0.3050537109375, 0.182861328125, 0.6707763671875, 1.15869140625, 1.6466064453125, 2.134521484375, 2.6224365234375, 3.1103515625, 3.5982666015625, 4.086181640625, 4.5740966796875, 5.06201171875, 5.5499267578125, 6.037841796875, 6.5257568359375, 7.013671875, 7.5015869140625, 7.989501953125, 8.4774169921875, 8.96533203125, 9.4532470703125, 9.941162109375, 10.4290771484375, 10.9169921875, 11.4049072265625, 11.892822265625, 12.3807373046875, 12.86865234375, 13.3565673828125, 13.844482421875, 14.3323974609375, 14.8203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 12.0, 17.0, 11.0, 22.0, 32.0, 35.0, 49.0, 53.0, 60.0, 108.0, 136.0, 115.0, 69.0, 43.0, 33.0, 31.0, 26.0, 25.0, 22.0, 18.0, 14.0, 8.0, 6.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004665374755859375, -0.0044901371002197266, -0.004314899444580078, -0.00413966178894043, -0.003964424133300781, -0.003789186477661133, -0.0036139488220214844, -0.003438711166381836, -0.0032634735107421875, -0.003088235855102539, -0.0029129981994628906, -0.002737760543823242, -0.0025625228881835938, -0.0023872852325439453, -0.002212047576904297, -0.0020368099212646484, -0.001861572265625, -0.0016863346099853516, -0.0015110969543457031, -0.0013358592987060547, -0.0011606216430664062, -0.0009853839874267578, -0.0008101463317871094, -0.0006349086761474609, -0.0004596710205078125, -0.00028443336486816406, -0.00010919570922851562, 6.604194641113281e-05, 0.00024127960205078125, 0.0004165172576904297, 0.0005917549133300781, 0.0007669925689697266, 0.000942230224609375, 0.0011174678802490234, 0.0012927055358886719, 0.0014679431915283203, 0.0016431808471679688, 0.0018184185028076172, 0.0019936561584472656, 0.002168893814086914, 0.0023441314697265625, 0.002519369125366211, 0.0026946067810058594, 0.002869844436645508, 0.0030450820922851562, 0.0032203197479248047, 0.003395557403564453, 0.0035707950592041016, 0.00374603271484375, 0.0039212703704833984, 0.004096508026123047, 0.004271745681762695, 0.004446983337402344, 0.004622220993041992, 0.004797458648681641, 0.004972696304321289, 0.0051479339599609375, 0.005323171615600586, 0.005498409271240234, 0.005673646926879883, 0.005848884582519531, 0.00602412223815918, 0.006199359893798828, 0.0063745975494384766, 0.006549835205078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 6.0, 12.0, 12.0, 6.0, 22.0, 33.0, 34.0, 64.0, 153.0, 259.0, 584.0, 1623.0, 6686.0, 59173.0, 824423.0, 140199.0, 11378.0, 2432.0, 781.0, 313.0, 153.0, 75.0, 47.0, 30.0, 25.0, 7.0, 13.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.40625, -31.18994140625, -29.9736328125, -28.75732421875, -27.541015625, -26.32470703125, -25.1083984375, -23.89208984375, -22.67578125, -21.45947265625, -20.2431640625, -19.02685546875, -17.810546875, -16.59423828125, -15.3779296875, -14.16162109375, -12.9453125, -11.72900390625, -10.5126953125, -9.29638671875, -8.080078125, -6.86376953125, -5.6474609375, -4.43115234375, -3.21484375, -1.99853515625, -0.7822265625, 0.43408203125, 1.650390625, 2.86669921875, 4.0830078125, 5.29931640625, 6.515625, 7.73193359375, 8.9482421875, 10.16455078125, 11.380859375, 12.59716796875, 13.8134765625, 15.02978515625, 16.24609375, 17.46240234375, 18.6787109375, 19.89501953125, 21.111328125, 22.32763671875, 23.5439453125, 24.76025390625, 25.9765625, 27.19287109375, 28.4091796875, 29.62548828125, 30.841796875, 32.05810546875, 33.2744140625, 34.49072265625, 35.70703125, 36.92333984375, 38.1396484375, 39.35595703125, 40.572265625, 41.78857421875, 43.0048828125, 44.22119140625, 45.4375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 3.0, 6.0, 8.0, 10.0, 9.0, 17.0, 15.0, 14.0, 21.0, 22.0, 31.0, 56.0, 47.0, 65.0, 76.0, 78.0, 92.0, 87.0, 78.0, 51.0, 46.0, 38.0, 30.0, 21.0, 15.0, 16.0, 11.0, 6.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.578125, -19.921142578125, -19.26416015625, -18.607177734375, -17.9501953125, -17.293212890625, -16.63623046875, -15.979248046875, -15.322265625, -14.665283203125, -14.00830078125, -13.351318359375, -12.6943359375, -12.037353515625, -11.38037109375, -10.723388671875, -10.06640625, -9.409423828125, -8.75244140625, -8.095458984375, -7.4384765625, -6.781494140625, -6.12451171875, -5.467529296875, -4.810546875, -4.153564453125, -3.49658203125, -2.839599609375, -2.1826171875, -1.525634765625, -0.86865234375, -0.211669921875, 0.4453125, 1.102294921875, 1.75927734375, 2.416259765625, 3.0732421875, 3.730224609375, 4.38720703125, 5.044189453125, 5.701171875, 6.358154296875, 7.01513671875, 7.672119140625, 8.3291015625, 8.986083984375, 9.64306640625, 10.300048828125, 10.95703125, 11.614013671875, 12.27099609375, 12.927978515625, 13.5849609375, 14.241943359375, 14.89892578125, 15.555908203125, 16.212890625, 16.869873046875, 17.52685546875, 18.183837890625, 18.8408203125, 19.497802734375, 20.15478515625, 20.811767578125, 21.46875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 14.0, 21.0, 53.0, 135.0, 205.0, 229.0, 150.0, 94.0, 56.0, 21.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-654.52978515625, -634.3231811523438, -614.1166381835938, -593.9100341796875, -573.7034301757812, -553.496826171875, -533.290283203125, -513.0836791992188, -492.8771057128906, -472.6705322265625, -452.46392822265625, -432.2573547363281, -412.05078125, -391.84417724609375, -371.6376037597656, -351.4310302734375, -331.22442626953125, -311.0178527832031, -290.8112487792969, -270.60467529296875, -250.39808654785156, -230.19149780273438, -209.98492431640625, -189.77833557128906, -169.57174682617188, -149.3651580810547, -129.1585693359375, -108.95199584960938, -88.74540710449219, -68.538818359375, -48.332237243652344, -28.125656127929688, -7.91900634765625, 12.287578582763672, 32.494163513183594, 52.700748443603516, 72.90733337402344, 93.11392211914062, 113.32050323486328, 133.52708435058594, 153.73367309570312, 173.9402618408203, 194.1468505859375, 214.35342407226562, 234.5600128173828, 254.7666015625, 274.9731750488281, 295.17974853515625, 315.3863525390625, 335.5929260253906, 355.7995300292969, 376.006103515625, 396.21270751953125, 416.4192810058594, 436.6258544921875, 456.83245849609375, 477.0390319824219, 497.24560546875, 517.4522094726562, 537.6588134765625, 557.8653564453125, 578.0719604492188, 598.278564453125, 618.485107421875, 638.6917114257812]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 3.0, 8.0, 10.0, 11.0, 14.0, 16.0, 14.0, 17.0, 18.0, 24.0, 34.0, 36.0, 23.0, 38.0, 47.0, 49.0, 52.0, 45.0, 37.0, 37.0, 45.0, 49.0, 35.0, 40.0, 42.0, 27.0, 31.0, 24.0, 26.0, 25.0, 21.0, 11.0, 12.0, 13.0, 15.0, 12.0, 3.0, 9.0, 1.0, 8.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-234.61538696289062, -225.93736267089844, -217.25933837890625, -208.58131408691406, -199.90328979492188, -191.22525024414062, -182.54722595214844, -173.86920166015625, -165.19117736816406, -156.51315307617188, -147.8351287841797, -139.1571044921875, -130.47906494140625, -121.8010482788086, -113.12301635742188, -104.44499206542969, -95.7669677734375, -87.08894348144531, -78.41091918945312, -69.7328872680664, -61.05486297607422, -52.37683868408203, -43.69881057739258, -35.020782470703125, -26.342758178710938, -17.664731979370117, -8.986705780029297, -0.30867958068847656, 8.369346618652344, 17.04737091064453, 25.725399017333984, 34.40342712402344, 43.0814208984375, 51.75944519042969, 60.43747329711914, 69.1155014038086, 77.79352569580078, 86.47154998779297, 95.14958190917969, 103.82760620117188, 112.50563049316406, 121.18365478515625, 129.86167907714844, 138.53970336914062, 147.21774291992188, 155.895751953125, 164.57379150390625, 173.25181579589844, 181.92984008789062, 190.6078643798828, 199.285888671875, 207.9639129638672, 216.64193725585938, 225.31997680664062, 233.9980010986328, 242.676025390625, 251.3540496826172, 260.0320739746094, 268.7101135253906, 277.38812255859375, 286.066162109375, 294.7441711425781, 303.4222106933594, 312.1002197265625, 320.77825927734375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 8.0, 16.0, 31.0, 25.0, 47.0, 57.0, 109.0, 118.0, 208.0, 289.0, 412.0, 680.0, 987.0, 1660.0, 2665.0, 4582.0, 8298.0, 15517.0, 34081.0, 91661.0, 395393.0, 2278083.0, 1068718.0, 185578.0, 55204.0, 23172.0, 11363.0, 6014.0, 3456.0, 1990.0, 1318.0, 795.0, 528.0, 373.0, 241.0, 184.0, 109.0, 106.0, 54.0, 34.0, 35.0, 17.0, 21.0, 10.0, 3.0, 6.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-21.40625, -20.71044921875, -20.0146484375, -19.31884765625, -18.623046875, -17.92724609375, -17.2314453125, -16.53564453125, -15.83984375, -15.14404296875, -14.4482421875, -13.75244140625, -13.056640625, -12.36083984375, -11.6650390625, -10.96923828125, -10.2734375, -9.57763671875, -8.8818359375, -8.18603515625, -7.490234375, -6.79443359375, -6.0986328125, -5.40283203125, -4.70703125, -4.01123046875, -3.3154296875, -2.61962890625, -1.923828125, -1.22802734375, -0.5322265625, 0.16357421875, 0.859375, 1.55517578125, 2.2509765625, 2.94677734375, 3.642578125, 4.33837890625, 5.0341796875, 5.72998046875, 6.42578125, 7.12158203125, 7.8173828125, 8.51318359375, 9.208984375, 9.90478515625, 10.6005859375, 11.29638671875, 11.9921875, 12.68798828125, 13.3837890625, 14.07958984375, 14.775390625, 15.47119140625, 16.1669921875, 16.86279296875, 17.55859375, 18.25439453125, 18.9501953125, 19.64599609375, 20.341796875, 21.03759765625, 21.7333984375, 22.42919921875, 23.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 5.0, 12.0, 12.0, 10.0, 17.0, 17.0, 21.0, 25.0, 22.0, 30.0, 24.0, 32.0, 42.0, 48.0, 36.0, 44.0, 45.0, 43.0, 46.0, 48.0, 48.0, 38.0, 38.0, 42.0, 39.0, 30.0, 27.0, 31.0, 17.0, 21.0, 16.0, 10.0, 10.0, 11.0, 7.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.03125, -12.5894775390625, -12.147705078125, -11.7059326171875, -11.26416015625, -10.8223876953125, -10.380615234375, -9.9388427734375, -9.4970703125, -9.0552978515625, -8.613525390625, -8.1717529296875, -7.72998046875, -7.2882080078125, -6.846435546875, -6.4046630859375, -5.962890625, -5.5211181640625, -5.079345703125, -4.6375732421875, -4.19580078125, -3.7540283203125, -3.312255859375, -2.8704833984375, -2.4287109375, -1.9869384765625, -1.545166015625, -1.1033935546875, -0.66162109375, -0.2198486328125, 0.221923828125, 0.6636962890625, 1.10546875, 1.5472412109375, 1.989013671875, 2.4307861328125, 2.87255859375, 3.3143310546875, 3.756103515625, 4.1978759765625, 4.6396484375, 5.0814208984375, 5.523193359375, 5.9649658203125, 6.40673828125, 6.8485107421875, 7.290283203125, 7.7320556640625, 8.173828125, 8.6156005859375, 9.057373046875, 9.4991455078125, 9.94091796875, 10.3826904296875, 10.824462890625, 11.2662353515625, 11.7080078125, 12.1497802734375, 12.591552734375, 13.0333251953125, 13.47509765625, 13.9168701171875, 14.358642578125, 14.8004150390625, 15.2421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 12.0, 12.0, 21.0, 18.0, 23.0, 42.0, 93.0, 102.0, 198.0, 347.0, 671.0, 1369.0, 3233.0, 9162.0, 36854.0, 280708.0, 3526244.0, 282902.0, 36683.0, 9309.0, 3283.0, 1378.0, 725.0, 352.0, 205.0, 113.0, 79.0, 48.0, 28.0, 20.0, 10.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-64.5, -62.73291015625, -60.9658203125, -59.19873046875, -57.431640625, -55.66455078125, -53.8974609375, -52.13037109375, -50.36328125, -48.59619140625, -46.8291015625, -45.06201171875, -43.294921875, -41.52783203125, -39.7607421875, -37.99365234375, -36.2265625, -34.45947265625, -32.6923828125, -30.92529296875, -29.158203125, -27.39111328125, -25.6240234375, -23.85693359375, -22.08984375, -20.32275390625, -18.5556640625, -16.78857421875, -15.021484375, -13.25439453125, -11.4873046875, -9.72021484375, -7.953125, -6.18603515625, -4.4189453125, -2.65185546875, -0.884765625, 0.88232421875, 2.6494140625, 4.41650390625, 6.18359375, 7.95068359375, 9.7177734375, 11.48486328125, 13.251953125, 15.01904296875, 16.7861328125, 18.55322265625, 20.3203125, 22.08740234375, 23.8544921875, 25.62158203125, 27.388671875, 29.15576171875, 30.9228515625, 32.68994140625, 34.45703125, 36.22412109375, 37.9912109375, 39.75830078125, 41.525390625, 43.29248046875, 45.0595703125, 46.82666015625, 48.59375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 5.0, 6.0, 6.0, 11.0, 16.0, 18.0, 29.0, 50.0, 60.0, 104.0, 184.0, 340.0, 674.0, 1075.0, 670.0, 300.0, 191.0, 108.0, 58.0, 36.0, 28.0, 26.0, 10.0, 18.0, 9.0, 9.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-65.3125, -63.521484375, -61.73046875, -59.939453125, -58.1484375, -56.357421875, -54.56640625, -52.775390625, -50.984375, -49.193359375, -47.40234375, -45.611328125, -43.8203125, -42.029296875, -40.23828125, -38.447265625, -36.65625, -34.865234375, -33.07421875, -31.283203125, -29.4921875, -27.701171875, -25.91015625, -24.119140625, -22.328125, -20.537109375, -18.74609375, -16.955078125, -15.1640625, -13.373046875, -11.58203125, -9.791015625, -8.0, -6.208984375, -4.41796875, -2.626953125, -0.8359375, 0.955078125, 2.74609375, 4.537109375, 6.328125, 8.119140625, 9.91015625, 11.701171875, 13.4921875, 15.283203125, 17.07421875, 18.865234375, 20.65625, 22.447265625, 24.23828125, 26.029296875, 27.8203125, 29.611328125, 31.40234375, 33.193359375, 34.984375, 36.775390625, 38.56640625, 40.357421875, 42.1484375, 43.939453125, 45.73046875, 47.521484375, 49.3125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 15.0, 14.0, 26.0, 40.0, 61.0, 103.0, 188.0, 185.0, 152.0, 81.0, 56.0, 31.0, 14.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-579.1993408203125, -563.2213745117188, -547.2434692382812, -531.2655029296875, -515.2875366210938, -499.30963134765625, -483.3316650390625, -467.3537292480469, -451.37579345703125, -435.3978576660156, -419.4198913574219, -403.44195556640625, -387.4640197753906, -371.486083984375, -355.50811767578125, -339.5301818847656, -323.5522155761719, -307.57427978515625, -291.5963134765625, -275.6183776855469, -259.64044189453125, -243.66249084472656, -227.68453979492188, -211.70660400390625, -195.72865295410156, -179.75070190429688, -163.77276611328125, -147.79481506347656, -131.81686401367188, -115.83892822265625, -99.86097717285156, -83.8830337524414, -67.90512084960938, -51.92717742919922, -35.9492301940918, -19.971282958984375, -3.9933395385742188, 11.984603881835938, 27.962554931640625, 43.94049835205078, 59.91844177246094, 75.8963851928711, 91.87432861328125, 107.85227966308594, 123.8302230834961, 139.80816650390625, 155.78611755371094, 171.76406860351562, 187.74200439453125, 203.71995544433594, 219.69789123535156, 235.67584228515625, 251.65377807617188, 267.6317138671875, 283.60968017578125, 299.5876159667969, 315.5655517578125, 331.5434875488281, 347.5214538574219, 363.4993896484375, 379.4773254394531, 395.45526123046875, 411.4332275390625, 427.4111633300781, 443.3891296386719]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 1.0, 4.0, 12.0, 13.0, 15.0, 20.0, 28.0, 31.0, 26.0, 30.0, 44.0, 30.0, 31.0, 40.0, 46.0, 47.0, 40.0, 40.0, 40.0, 38.0, 52.0, 46.0, 35.0, 31.0, 28.0, 35.0, 26.0, 32.0, 8.0, 19.0, 22.0, 17.0, 13.0, 11.0, 9.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-211.9520263671875, -205.6383056640625, -199.3245849609375, -193.01084899902344, -186.69712829589844, -180.38340759277344, -174.06967163085938, -167.75595092773438, -161.44223022460938, -155.12850952148438, -148.81478881835938, -142.5010528564453, -136.1873321533203, -129.8736114501953, -123.55988311767578, -117.24615478515625, -110.93243408203125, -104.61871337890625, -98.30498504638672, -91.99125671386719, -85.67753601074219, -79.36381530761719, -73.05008697509766, -66.73635864257812, -60.422637939453125, -54.10891342163086, -47.795188903808594, -41.48146438598633, -35.16773986816406, -28.854015350341797, -22.54029083251953, -16.226566314697266, -9.912857055664062, -3.599132537841797, 2.7145919799804688, 9.028316497802734, 15.342041015625, 21.655765533447266, 27.96949005126953, 34.2832145690918, 40.59693908691406, 46.91066360473633, 53.224388122558594, 59.53811264038086, 65.85183715820312, 72.16555786132812, 78.47928619384766, 84.79301452636719, 91.10673522949219, 97.42045593261719, 103.73418426513672, 110.04791259765625, 116.36163330078125, 122.67535400390625, 128.98907470703125, 135.3028106689453, 141.6165313720703, 147.9302520751953, 154.24398803710938, 160.55770874023438, 166.87142944335938, 173.18515014648438, 179.49887084960938, 185.81260681152344, 192.12632751464844]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 13.0, 15.0, 27.0, 32.0, 63.0, 80.0, 121.0, 208.0, 330.0, 601.0, 939.0, 1661.0, 2968.0, 5658.0, 10758.0, 21929.0, 48527.0, 127882.0, 398265.0, 273544.0, 84540.0, 35445.0, 16606.0, 8252.0, 4356.0, 2342.0, 1312.0, 803.0, 482.0, 297.0, 155.0, 114.0, 75.0, 41.0, 29.0, 17.0, 15.0, 16.0, 5.0, 3.0, 7.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.28125, -31.2333984375, -30.185546875, -29.1376953125, -28.08984375, -27.0419921875, -25.994140625, -24.9462890625, -23.8984375, -22.8505859375, -21.802734375, -20.7548828125, -19.70703125, -18.6591796875, -17.611328125, -16.5634765625, -15.515625, -14.4677734375, -13.419921875, -12.3720703125, -11.32421875, -10.2763671875, -9.228515625, -8.1806640625, -7.1328125, -6.0849609375, -5.037109375, -3.9892578125, -2.94140625, -1.8935546875, -0.845703125, 0.2021484375, 1.25, 2.2978515625, 3.345703125, 4.3935546875, 5.44140625, 6.4892578125, 7.537109375, 8.5849609375, 9.6328125, 10.6806640625, 11.728515625, 12.7763671875, 13.82421875, 14.8720703125, 15.919921875, 16.9677734375, 18.015625, 19.0634765625, 20.111328125, 21.1591796875, 22.20703125, 23.2548828125, 24.302734375, 25.3505859375, 26.3984375, 27.4462890625, 28.494140625, 29.5419921875, 30.58984375, 31.6376953125, 32.685546875, 33.7333984375, 34.78125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 8.0, 8.0, 8.0, 12.0, 17.0, 13.0, 24.0, 30.0, 26.0, 19.0, 29.0, 32.0, 36.0, 34.0, 46.0, 46.0, 42.0, 58.0, 45.0, 47.0, 56.0, 42.0, 54.0, 33.0, 27.0, 39.0, 23.0, 23.0, 23.0, 11.0, 13.0, 12.0, 11.0, 9.0, 11.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.6556396484375, -15.186279296875, -14.7169189453125, -14.24755859375, -13.7781982421875, -13.308837890625, -12.8394775390625, -12.3701171875, -11.9007568359375, -11.431396484375, -10.9620361328125, -10.49267578125, -10.0233154296875, -9.553955078125, -9.0845947265625, -8.615234375, -8.1458740234375, -7.676513671875, -7.2071533203125, -6.73779296875, -6.2684326171875, -5.799072265625, -5.3297119140625, -4.8603515625, -4.3909912109375, -3.921630859375, -3.4522705078125, -2.98291015625, -2.5135498046875, -2.044189453125, -1.5748291015625, -1.10546875, -0.6361083984375, -0.166748046875, 0.3026123046875, 0.77197265625, 1.2413330078125, 1.710693359375, 2.1800537109375, 2.6494140625, 3.1187744140625, 3.588134765625, 4.0574951171875, 4.52685546875, 4.9962158203125, 5.465576171875, 5.9349365234375, 6.404296875, 6.8736572265625, 7.343017578125, 7.8123779296875, 8.28173828125, 8.7510986328125, 9.220458984375, 9.6898193359375, 10.1591796875, 10.6285400390625, 11.097900390625, 11.5672607421875, 12.03662109375, 12.5059814453125, 12.975341796875, 13.4447021484375, 13.9140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 3.0, 7.0, 5.0, 13.0, 14.0, 12.0, 34.0, 40.0, 39.0, 78.0, 105.0, 191.0, 324.0, 684.0, 1624.0, 5370.0, 42067.0, 885242.0, 99777.0, 8802.0, 2187.0, 895.0, 404.0, 249.0, 128.0, 90.0, 50.0, 31.0, 28.0, 16.0, 16.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-123.375, -119.7080078125, -116.041015625, -112.3740234375, -108.70703125, -105.0400390625, -101.373046875, -97.7060546875, -94.0390625, -90.3720703125, -86.705078125, -83.0380859375, -79.37109375, -75.7041015625, -72.037109375, -68.3701171875, -64.703125, -61.0361328125, -57.369140625, -53.7021484375, -50.03515625, -46.3681640625, -42.701171875, -39.0341796875, -35.3671875, -31.7001953125, -28.033203125, -24.3662109375, -20.69921875, -17.0322265625, -13.365234375, -9.6982421875, -6.03125, -2.3642578125, 1.302734375, 4.9697265625, 8.63671875, 12.3037109375, 15.970703125, 19.6376953125, 23.3046875, 26.9716796875, 30.638671875, 34.3056640625, 37.97265625, 41.6396484375, 45.306640625, 48.9736328125, 52.640625, 56.3076171875, 59.974609375, 63.6416015625, 67.30859375, 70.9755859375, 74.642578125, 78.3095703125, 81.9765625, 85.6435546875, 89.310546875, 92.9775390625, 96.64453125, 100.3115234375, 103.978515625, 107.6455078125, 111.3125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 15.0, 14.0, 16.0, 22.0, 19.0, 21.0, 26.0, 34.0, 38.0, 40.0, 51.0, 49.0, 51.0, 46.0, 64.0, 44.0, 42.0, 49.0, 51.0, 51.0, 36.0, 40.0, 26.0, 32.0, 22.0, 22.0, 18.0, 8.0, 11.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-96.3125, -93.689453125, -91.06640625, -88.443359375, -85.8203125, -83.197265625, -80.57421875, -77.951171875, -75.328125, -72.705078125, -70.08203125, -67.458984375, -64.8359375, -62.212890625, -59.58984375, -56.966796875, -54.34375, -51.720703125, -49.09765625, -46.474609375, -43.8515625, -41.228515625, -38.60546875, -35.982421875, -33.359375, -30.736328125, -28.11328125, -25.490234375, -22.8671875, -20.244140625, -17.62109375, -14.998046875, -12.375, -9.751953125, -7.12890625, -4.505859375, -1.8828125, 0.740234375, 3.36328125, 5.986328125, 8.609375, 11.232421875, 13.85546875, 16.478515625, 19.1015625, 21.724609375, 24.34765625, 26.970703125, 29.59375, 32.216796875, 34.83984375, 37.462890625, 40.0859375, 42.708984375, 45.33203125, 47.955078125, 50.578125, 53.201171875, 55.82421875, 58.447265625, 61.0703125, 63.693359375, 66.31640625, 68.939453125, 71.5625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 6.0, 0.0, 3.0, 4.0, 13.0, 17.0, 17.0, 34.0, 46.0, 69.0, 103.0, 177.0, 293.0, 556.0, 1119.0, 3016.0, 9479.0, 43598.0, 589325.0, 353679.0, 34112.0, 7946.0, 2677.0, 1051.0, 463.0, 278.0, 166.0, 104.0, 51.0, 40.0, 33.0, 21.0, 14.0, 8.0, 10.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.625, -30.568359375, -29.51171875, -28.455078125, -27.3984375, -26.341796875, -25.28515625, -24.228515625, -23.171875, -22.115234375, -21.05859375, -20.001953125, -18.9453125, -17.888671875, -16.83203125, -15.775390625, -14.71875, -13.662109375, -12.60546875, -11.548828125, -10.4921875, -9.435546875, -8.37890625, -7.322265625, -6.265625, -5.208984375, -4.15234375, -3.095703125, -2.0390625, -0.982421875, 0.07421875, 1.130859375, 2.1875, 3.244140625, 4.30078125, 5.357421875, 6.4140625, 7.470703125, 8.52734375, 9.583984375, 10.640625, 11.697265625, 12.75390625, 13.810546875, 14.8671875, 15.923828125, 16.98046875, 18.037109375, 19.09375, 20.150390625, 21.20703125, 22.263671875, 23.3203125, 24.376953125, 25.43359375, 26.490234375, 27.546875, 28.603515625, 29.66015625, 30.716796875, 31.7734375, 32.830078125, 33.88671875, 34.943359375, 36.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 14.0, 18.0, 24.0, 43.0, 68.0, 168.0, 299.0, 159.0, 80.0, 36.0, 27.0, 10.0, 9.0, 12.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01123046875, -0.010807275772094727, -0.010384082794189453, -0.00996088981628418, -0.009537696838378906, -0.009114503860473633, -0.00869131088256836, -0.008268117904663086, -0.007844924926757812, -0.007421731948852539, -0.006998538970947266, -0.006575345993041992, -0.006152153015136719, -0.005728960037231445, -0.005305767059326172, -0.0048825740814208984, -0.004459381103515625, -0.0040361881256103516, -0.003612995147705078, -0.0031898021697998047, -0.0027666091918945312, -0.002343416213989258, -0.0019202232360839844, -0.001497030258178711, -0.0010738372802734375, -0.0006506443023681641, -0.00022745132446289062, 0.0001957416534423828, 0.0006189346313476562, 0.0010421276092529297, 0.0014653205871582031, 0.0018885135650634766, 0.00231170654296875, 0.0027348995208740234, 0.003158092498779297, 0.0035812854766845703, 0.004004478454589844, 0.004427671432495117, 0.004850864410400391, 0.005274057388305664, 0.0056972503662109375, 0.006120443344116211, 0.006543636322021484, 0.006966829299926758, 0.007390022277832031, 0.007813215255737305, 0.008236408233642578, 0.008659601211547852, 0.009082794189453125, 0.009505987167358398, 0.009929180145263672, 0.010352373123168945, 0.010775566101074219, 0.011198759078979492, 0.011621952056884766, 0.012045145034790039, 0.012468338012695312, 0.012891530990600586, 0.01331472396850586, 0.013737916946411133, 0.014161109924316406, 0.01458430290222168, 0.015007495880126953, 0.015430688858032227, 0.0158538818359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 13.0, 31.0, 44.0, 46.0, 103.0, 160.0, 299.0, 644.0, 1619.0, 5760.0, 39874.0, 812286.0, 169935.0, 12775.0, 2930.0, 982.0, 455.0, 229.0, 117.0, 75.0, 53.0, 28.0, 12.0, 11.0, 12.0, 8.0, 6.0, 3.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.9375, -48.5, -47.0625, -45.625, -44.1875, -42.75, -41.3125, -39.875, -38.4375, -37.0, -35.5625, -34.125, -32.6875, -31.25, -29.8125, -28.375, -26.9375, -25.5, -24.0625, -22.625, -21.1875, -19.75, -18.3125, -16.875, -15.4375, -14.0, -12.5625, -11.125, -9.6875, -8.25, -6.8125, -5.375, -3.9375, -2.5, -1.0625, 0.375, 1.8125, 3.25, 4.6875, 6.125, 7.5625, 9.0, 10.4375, 11.875, 13.3125, 14.75, 16.1875, 17.625, 19.0625, 20.5, 21.9375, 23.375, 24.8125, 26.25, 27.6875, 29.125, 30.5625, 32.0, 33.4375, 34.875, 36.3125, 37.75, 39.1875, 40.625, 42.0625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 10.0, 8.0, 26.0, 21.0, 22.0, 49.0, 30.0, 43.0, 40.0, 67.0, 75.0, 87.0, 67.0, 74.0, 78.0, 50.0, 41.0, 43.0, 37.0, 17.0, 17.0, 20.0, 12.0, 7.0, 15.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0, -24.262939453125, -23.52587890625, -22.788818359375, -22.0517578125, -21.314697265625, -20.57763671875, -19.840576171875, -19.103515625, -18.366455078125, -17.62939453125, -16.892333984375, -16.1552734375, -15.418212890625, -14.68115234375, -13.944091796875, -13.20703125, -12.469970703125, -11.73291015625, -10.995849609375, -10.2587890625, -9.521728515625, -8.78466796875, -8.047607421875, -7.310546875, -6.573486328125, -5.83642578125, -5.099365234375, -4.3623046875, -3.625244140625, -2.88818359375, -2.151123046875, -1.4140625, -0.677001953125, 0.06005859375, 0.797119140625, 1.5341796875, 2.271240234375, 3.00830078125, 3.745361328125, 4.482421875, 5.219482421875, 5.95654296875, 6.693603515625, 7.4306640625, 8.167724609375, 8.90478515625, 9.641845703125, 10.37890625, 11.115966796875, 11.85302734375, 12.590087890625, 13.3271484375, 14.064208984375, 14.80126953125, 15.538330078125, 16.275390625, 17.012451171875, 17.74951171875, 18.486572265625, 19.2236328125, 19.960693359375, 20.69775390625, 21.434814453125, 22.171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 49.0, 102.0, 228.0, 285.0, 168.0, 82.0, 24.0, 17.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-892.9130859375, -867.6424560546875, -842.3717651367188, -817.1011352539062, -791.8304443359375, -766.559814453125, -741.2891845703125, -716.0184936523438, -690.747802734375, -665.4771728515625, -640.2064819335938, -614.9358520507812, -589.6651611328125, -564.39453125, -539.1239013671875, -513.8532104492188, -488.58258056640625, -463.3119201660156, -438.041259765625, -412.7706298828125, -387.49993896484375, -362.22930908203125, -336.9586486816406, -311.68798828125, -286.4173278808594, -261.14666748046875, -235.87600708007812, -210.60536193847656, -185.33470153808594, -160.0640411376953, -134.79339599609375, -109.52273559570312, -84.25201416015625, -58.98135757446289, -33.71070098876953, -8.440048217773438, 16.830612182617188, 42.10127258300781, 67.37191772460938, 92.642578125, 117.91323852539062, 143.18389892578125, 168.45455932617188, 193.72520446777344, 218.99586486816406, 244.2665252685547, 269.53717041015625, 294.8078308105469, 320.0784912109375, 345.3491516113281, 370.61981201171875, 395.89044189453125, 421.1611328125, 446.4317626953125, 471.7024230957031, 496.97308349609375, 522.2437744140625, 547.514404296875, 572.7850952148438, 598.0557250976562, 623.326416015625, 648.5970458984375, 673.86767578125, 699.1383666992188, 724.4089965820312]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 10.0, 6.0, 7.0, 9.0, 8.0, 17.0, 21.0, 19.0, 23.0, 27.0, 36.0, 50.0, 50.0, 49.0, 55.0, 68.0, 64.0, 55.0, 65.0, 64.0, 46.0, 41.0, 31.0, 23.0, 35.0, 23.0, 25.0, 18.0, 12.0, 16.0, 11.0, 5.0, 5.0, 3.0, 0.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.068603515625, -311.17230224609375, -300.2759704589844, -289.3796691894531, -278.4833679199219, -267.5870361328125, -256.69073486328125, -245.79443359375, -234.8981170654297, -224.00180053710938, -213.10549926757812, -202.2091827392578, -191.3128662109375, -180.41656494140625, -169.52024841308594, -158.62393188476562, -147.72763061523438, -136.83131408691406, -125.93501281738281, -115.0386962890625, -104.14238739013672, -93.24607849121094, -82.34976196289062, -71.45345306396484, -60.55714416503906, -49.66083526611328, -38.764522552490234, -27.868209838867188, -16.971900939941406, -6.075592041015625, 4.8207244873046875, 15.717033386230469, 26.613311767578125, 37.509620666503906, 48.40593338012695, 59.30224609375, 70.19855499267578, 81.09486389160156, 91.99118041992188, 102.88748931884766, 113.78379821777344, 124.68010711669922, 135.576416015625, 146.4727325439453, 157.36904907226562, 168.26535034179688, 179.1616668701172, 190.0579833984375, 200.95428466796875, 211.85060119628906, 222.7469024658203, 233.64321899414062, 244.53952026367188, 255.4358367919922, 266.3321533203125, 277.22845458984375, 288.124755859375, 299.02105712890625, 309.9173889160156, 320.8136901855469, 331.7099914550781, 342.6063232421875, 353.50262451171875, 364.39892578125, 375.2952575683594]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 5.0, 12.0, 12.0, 14.0, 17.0, 31.0, 45.0, 49.0, 88.0, 124.0, 280.0, 3327.0, 1225116.0, 2960126.0, 4253.0, 353.0, 117.0, 90.0, 57.0, 42.0, 30.0, 22.0, 17.0, 11.0, 19.0, 6.0, 0.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.125, -148.19140625, -143.2578125, -138.32421875, -133.390625, -128.45703125, -123.5234375, -118.58984375, -113.65625, -108.72265625, -103.7890625, -98.85546875, -93.921875, -88.98828125, -84.0546875, -79.12109375, -74.1875, -69.25390625, -64.3203125, -59.38671875, -54.453125, -49.51953125, -44.5859375, -39.65234375, -34.71875, -29.78515625, -24.8515625, -19.91796875, -14.984375, -10.05078125, -5.1171875, -0.18359375, 4.75, 9.68359375, 14.6171875, 19.55078125, 24.484375, 29.41796875, 34.3515625, 39.28515625, 44.21875, 49.15234375, 54.0859375, 59.01953125, 63.953125, 68.88671875, 73.8203125, 78.75390625, 83.6875, 88.62109375, 93.5546875, 98.48828125, 103.421875, 108.35546875, 113.2890625, 118.22265625, 123.15625, 128.08984375, 133.0234375, 137.95703125, 142.890625, 147.82421875, 152.7578125, 157.69140625, 162.625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 10.0, 4.0, 9.0, 8.0, 13.0, 15.0, 32.0, 37.0, 27.0, 45.0, 53.0, 61.0, 71.0, 70.0, 63.0, 71.0, 70.0, 55.0, 50.0, 61.0, 45.0, 39.0, 23.0, 15.0, 17.0, 15.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.0499267578125, -14.388916015625, -13.7279052734375, -13.06689453125, -12.4058837890625, -11.744873046875, -11.0838623046875, -10.4228515625, -9.7618408203125, -9.100830078125, -8.4398193359375, -7.77880859375, -7.1177978515625, -6.456787109375, -5.7957763671875, -5.134765625, -4.4737548828125, -3.812744140625, -3.1517333984375, -2.49072265625, -1.8297119140625, -1.168701171875, -0.5076904296875, 0.1533203125, 0.8143310546875, 1.475341796875, 2.1363525390625, 2.79736328125, 3.4583740234375, 4.119384765625, 4.7803955078125, 5.44140625, 6.1024169921875, 6.763427734375, 7.4244384765625, 8.08544921875, 8.7464599609375, 9.407470703125, 10.0684814453125, 10.7294921875, 11.3905029296875, 12.051513671875, 12.7125244140625, 13.37353515625, 14.0345458984375, 14.695556640625, 15.3565673828125, 16.017578125, 16.6785888671875, 17.339599609375, 18.0006103515625, 18.66162109375, 19.3226318359375, 19.983642578125, 20.6446533203125, 21.3056640625, 21.9666748046875, 22.627685546875, 23.2886962890625, 23.94970703125, 24.6107177734375, 25.271728515625, 25.9327392578125, 26.59375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 2.0, 13.0, 16.0, 19.0, 29.0, 51.0, 80.0, 139.0, 206.0, 332.0, 643.0, 1160.0, 2162.0, 4568.0, 10696.0, 28556.0, 101457.0, 828424.0, 2844014.0, 281927.0, 56051.0, 18701.0, 7664.0, 3484.0, 1720.0, 845.0, 512.0, 309.0, 170.0, 118.0, 62.0, 48.0, 30.0, 19.0, 11.0, 14.0, 7.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.34375, -35.1025390625, -33.861328125, -32.6201171875, -31.37890625, -30.1376953125, -28.896484375, -27.6552734375, -26.4140625, -25.1728515625, -23.931640625, -22.6904296875, -21.44921875, -20.2080078125, -18.966796875, -17.7255859375, -16.484375, -15.2431640625, -14.001953125, -12.7607421875, -11.51953125, -10.2783203125, -9.037109375, -7.7958984375, -6.5546875, -5.3134765625, -4.072265625, -2.8310546875, -1.58984375, -0.3486328125, 0.892578125, 2.1337890625, 3.375, 4.6162109375, 5.857421875, 7.0986328125, 8.33984375, 9.5810546875, 10.822265625, 12.0634765625, 13.3046875, 14.5458984375, 15.787109375, 17.0283203125, 18.26953125, 19.5107421875, 20.751953125, 21.9931640625, 23.234375, 24.4755859375, 25.716796875, 26.9580078125, 28.19921875, 29.4404296875, 30.681640625, 31.9228515625, 33.1640625, 34.4052734375, 35.646484375, 36.8876953125, 38.12890625, 39.3701171875, 40.611328125, 41.8525390625, 43.09375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 12.0, 18.0, 20.0, 29.0, 49.0, 63.0, 87.0, 161.0, 253.0, 492.0, 811.0, 763.0, 517.0, 287.0, 162.0, 98.0, 58.0, 40.0, 29.0, 24.0, 25.0, 5.0, 12.0, 7.0, 5.0, 10.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -45.82275390625, -44.2392578125, -42.65576171875, -41.072265625, -39.48876953125, -37.9052734375, -36.32177734375, -34.73828125, -33.15478515625, -31.5712890625, -29.98779296875, -28.404296875, -26.82080078125, -25.2373046875, -23.65380859375, -22.0703125, -20.48681640625, -18.9033203125, -17.31982421875, -15.736328125, -14.15283203125, -12.5693359375, -10.98583984375, -9.40234375, -7.81884765625, -6.2353515625, -4.65185546875, -3.068359375, -1.48486328125, 0.0986328125, 1.68212890625, 3.265625, 4.84912109375, 6.4326171875, 8.01611328125, 9.599609375, 11.18310546875, 12.7666015625, 14.35009765625, 15.93359375, 17.51708984375, 19.1005859375, 20.68408203125, 22.267578125, 23.85107421875, 25.4345703125, 27.01806640625, 28.6015625, 30.18505859375, 31.7685546875, 33.35205078125, 34.935546875, 36.51904296875, 38.1025390625, 39.68603515625, 41.26953125, 42.85302734375, 44.4365234375, 46.02001953125, 47.603515625, 49.18701171875, 50.7705078125, 52.35400390625, 53.9375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 29.0, 71.0, 151.0, 246.0, 218.0, 142.0, 60.0, 26.0, 7.0, 7.0, 5.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-771.695556640625, -752.2750244140625, -732.8544311523438, -713.433837890625, -694.0133056640625, -674.5927734375, -655.1721801757812, -635.7515869140625, -616.3310546875, -596.9105224609375, -577.4899291992188, -558.0693359375, -538.6488037109375, -519.228271484375, -499.80767822265625, -480.3871154785156, -460.966552734375, -441.5459899902344, -422.12542724609375, -402.7048645019531, -383.2843017578125, -363.8637390136719, -344.44317626953125, -325.0226135253906, -305.60205078125, -286.1814880371094, -266.76092529296875, -247.34036254882812, -227.9197998046875, -208.49923706054688, -189.07867431640625, -169.65811157226562, -150.23760986328125, -130.81704711914062, -111.396484375, -91.97592163085938, -72.55535888671875, -53.134796142578125, -33.7142333984375, -14.293670654296875, 5.12689208984375, 24.547454833984375, 43.968017578125, 63.388580322265625, 82.80914306640625, 102.22970581054688, 121.6502685546875, 141.07083129882812, 160.49139404296875, 179.91195678710938, 199.33251953125, 218.75308227539062, 238.17364501953125, 257.5942077636719, 277.0147705078125, 296.4353332519531, 315.85589599609375, 335.2764587402344, 354.697021484375, 374.1175842285156, 393.53814697265625, 412.9587097167969, 432.3792724609375, 451.7998352050781, 471.22039794921875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 1.0, 5.0, 7.0, 8.0, 13.0, 15.0, 17.0, 16.0, 29.0, 18.0, 30.0, 27.0, 29.0, 40.0, 44.0, 46.0, 44.0, 45.0, 42.0, 44.0, 60.0, 47.0, 43.0, 39.0, 36.0, 40.0, 39.0, 34.0, 22.0, 26.0, 19.0, 14.0, 14.0, 9.0, 8.0, 13.0, 4.0, 8.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-292.1580810546875, -284.7128601074219, -277.26763916015625, -269.8224182128906, -262.377197265625, -254.93199157714844, -247.4867706298828, -240.04156494140625, -232.59634399414062, -225.151123046875, -217.70590209960938, -210.2606964111328, -202.8154754638672, -195.37025451660156, -187.92503356933594, -180.47982788085938, -173.03460693359375, -165.58938598632812, -158.1441650390625, -150.69895935058594, -143.2537384033203, -135.8085174560547, -128.36329650878906, -120.91808319091797, -113.47285461425781, -106.02763366699219, -98.5824203491211, -91.13719940185547, -83.69198608398438, -76.24676513671875, -68.80154418945312, -61.35633087158203, -53.91111755371094, -46.46590042114258, -39.02068328857422, -31.575464248657227, -24.130247116088867, -16.685028076171875, -9.239810943603516, -1.7945938110351562, 5.650623321533203, 13.095840454101562, 20.541057586669922, 27.986276626586914, 35.431495666503906, 42.876712799072266, 50.321929931640625, 57.767147064208984, 65.21236419677734, 72.65758514404297, 80.10279846191406, 87.54801940917969, 94.99323272705078, 102.4384536743164, 109.8836669921875, 117.32888793945312, 124.77410888671875, 132.21932983398438, 139.66455078125, 147.10975646972656, 154.5549774169922, 162.0001983642578, 169.44541931152344, 176.890625, 184.33584594726562]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 15.0, 13.0, 21.0, 22.0, 71.0, 84.0, 157.0, 281.0, 481.0, 799.0, 1492.0, 2839.0, 5808.0, 12567.0, 30434.0, 88977.0, 388337.0, 375212.0, 86561.0, 30069.0, 12436.0, 5687.0, 2718.0, 1528.0, 818.0, 477.0, 254.0, 144.0, 89.0, 71.0, 30.0, 22.0, 17.0, 10.0, 9.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.28125, -35.94921875, -34.6171875, -33.28515625, -31.953125, -30.62109375, -29.2890625, -27.95703125, -26.625, -25.29296875, -23.9609375, -22.62890625, -21.296875, -19.96484375, -18.6328125, -17.30078125, -15.96875, -14.63671875, -13.3046875, -11.97265625, -10.640625, -9.30859375, -7.9765625, -6.64453125, -5.3125, -3.98046875, -2.6484375, -1.31640625, 0.015625, 1.34765625, 2.6796875, 4.01171875, 5.34375, 6.67578125, 8.0078125, 9.33984375, 10.671875, 12.00390625, 13.3359375, 14.66796875, 16.0, 17.33203125, 18.6640625, 19.99609375, 21.328125, 22.66015625, 23.9921875, 25.32421875, 26.65625, 27.98828125, 29.3203125, 30.65234375, 31.984375, 33.31640625, 34.6484375, 35.98046875, 37.3125, 38.64453125, 39.9765625, 41.30859375, 42.640625, 43.97265625, 45.3046875, 46.63671875, 47.96875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 5.0, 4.0, 4.0, 15.0, 7.0, 12.0, 14.0, 12.0, 16.0, 20.0, 27.0, 26.0, 32.0, 37.0, 33.0, 42.0, 29.0, 51.0, 55.0, 47.0, 42.0, 47.0, 47.0, 42.0, 37.0, 41.0, 36.0, 29.0, 28.0, 19.0, 24.0, 19.0, 17.0, 10.0, 16.0, 12.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.28125, -16.773193359375, -16.26513671875, -15.757080078125, -15.2490234375, -14.740966796875, -14.23291015625, -13.724853515625, -13.216796875, -12.708740234375, -12.20068359375, -11.692626953125, -11.1845703125, -10.676513671875, -10.16845703125, -9.660400390625, -9.15234375, -8.644287109375, -8.13623046875, -7.628173828125, -7.1201171875, -6.612060546875, -6.10400390625, -5.595947265625, -5.087890625, -4.579833984375, -4.07177734375, -3.563720703125, -3.0556640625, -2.547607421875, -2.03955078125, -1.531494140625, -1.0234375, -0.515380859375, -0.00732421875, 0.500732421875, 1.0087890625, 1.516845703125, 2.02490234375, 2.532958984375, 3.041015625, 3.549072265625, 4.05712890625, 4.565185546875, 5.0732421875, 5.581298828125, 6.08935546875, 6.597412109375, 7.10546875, 7.613525390625, 8.12158203125, 8.629638671875, 9.1376953125, 9.645751953125, 10.15380859375, 10.661865234375, 11.169921875, 11.677978515625, 12.18603515625, 12.694091796875, 13.2021484375, 13.710205078125, 14.21826171875, 14.726318359375, 15.234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 8.0, 13.0, 17.0, 19.0, 36.0, 55.0, 86.0, 161.0, 282.0, 567.0, 1296.0, 3565.0, 15903.0, 197851.0, 784681.0, 34439.0, 5978.0, 1943.0, 776.0, 380.0, 166.0, 116.0, 77.0, 44.0, 25.0, 18.0, 13.0, 8.0, 6.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.5, -100.79296875, -97.0859375, -93.37890625, -89.671875, -85.96484375, -82.2578125, -78.55078125, -74.84375, -71.13671875, -67.4296875, -63.72265625, -60.015625, -56.30859375, -52.6015625, -48.89453125, -45.1875, -41.48046875, -37.7734375, -34.06640625, -30.359375, -26.65234375, -22.9453125, -19.23828125, -15.53125, -11.82421875, -8.1171875, -4.41015625, -0.703125, 3.00390625, 6.7109375, 10.41796875, 14.125, 17.83203125, 21.5390625, 25.24609375, 28.953125, 32.66015625, 36.3671875, 40.07421875, 43.78125, 47.48828125, 51.1953125, 54.90234375, 58.609375, 62.31640625, 66.0234375, 69.73046875, 73.4375, 77.14453125, 80.8515625, 84.55859375, 88.265625, 91.97265625, 95.6796875, 99.38671875, 103.09375, 106.80078125, 110.5078125, 114.21484375, 117.921875, 121.62890625, 125.3359375, 129.04296875, 132.75]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 10.0, 14.0, 14.0, 17.0, 32.0, 24.0, 35.0, 39.0, 45.0, 48.0, 64.0, 57.0, 55.0, 65.0, 67.0, 59.0, 49.0, 53.0, 41.0, 39.0, 29.0, 35.0, 18.0, 25.0, 11.0, 10.0, 4.0, 5.0, 3.0, 0.0, 7.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-116.4375, -113.2392578125, -110.041015625, -106.8427734375, -103.64453125, -100.4462890625, -97.248046875, -94.0498046875, -90.8515625, -87.6533203125, -84.455078125, -81.2568359375, -78.05859375, -74.8603515625, -71.662109375, -68.4638671875, -65.265625, -62.0673828125, -58.869140625, -55.6708984375, -52.47265625, -49.2744140625, -46.076171875, -42.8779296875, -39.6796875, -36.4814453125, -33.283203125, -30.0849609375, -26.88671875, -23.6884765625, -20.490234375, -17.2919921875, -14.09375, -10.8955078125, -7.697265625, -4.4990234375, -1.30078125, 1.8974609375, 5.095703125, 8.2939453125, 11.4921875, 14.6904296875, 17.888671875, 21.0869140625, 24.28515625, 27.4833984375, 30.681640625, 33.8798828125, 37.078125, 40.2763671875, 43.474609375, 46.6728515625, 49.87109375, 53.0693359375, 56.267578125, 59.4658203125, 62.6640625, 65.8623046875, 69.060546875, 72.2587890625, 75.45703125, 78.6552734375, 81.853515625, 85.0517578125, 88.25]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 7.0, 4.0, 9.0, 17.0, 16.0, 25.0, 31.0, 87.0, 170.0, 362.0, 1176.0, 4504.0, 32422.0, 773799.0, 218079.0, 13957.0, 2570.0, 741.0, 277.0, 133.0, 79.0, 33.0, 18.0, 11.0, 6.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.96875, -51.13037109375, -49.2919921875, -47.45361328125, -45.615234375, -43.77685546875, -41.9384765625, -40.10009765625, -38.26171875, -36.42333984375, -34.5849609375, -32.74658203125, -30.908203125, -29.06982421875, -27.2314453125, -25.39306640625, -23.5546875, -21.71630859375, -19.8779296875, -18.03955078125, -16.201171875, -14.36279296875, -12.5244140625, -10.68603515625, -8.84765625, -7.00927734375, -5.1708984375, -3.33251953125, -1.494140625, 0.34423828125, 2.1826171875, 4.02099609375, 5.859375, 7.69775390625, 9.5361328125, 11.37451171875, 13.212890625, 15.05126953125, 16.8896484375, 18.72802734375, 20.56640625, 22.40478515625, 24.2431640625, 26.08154296875, 27.919921875, 29.75830078125, 31.5966796875, 33.43505859375, 35.2734375, 37.11181640625, 38.9501953125, 40.78857421875, 42.626953125, 44.46533203125, 46.3037109375, 48.14208984375, 49.98046875, 51.81884765625, 53.6572265625, 55.49560546875, 57.333984375, 59.17236328125, 61.0107421875, 62.84912109375, 64.6875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 10.0, 13.0, 13.0, 22.0, 29.0, 48.0, 71.0, 151.0, 190.0, 170.0, 90.0, 51.0, 48.0, 31.0, 15.0, 11.0, 6.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01163482666015625, -0.011334061622619629, -0.011033296585083008, -0.010732531547546387, -0.010431766510009766, -0.010131001472473145, -0.009830236434936523, -0.009529471397399902, -0.009228706359863281, -0.00892794132232666, -0.008627176284790039, -0.008326411247253418, -0.008025646209716797, -0.007724881172180176, -0.007424116134643555, -0.007123351097106934, -0.0068225860595703125, -0.006521821022033691, -0.00622105598449707, -0.005920290946960449, -0.005619525909423828, -0.005318760871887207, -0.005017995834350586, -0.004717230796813965, -0.004416465759277344, -0.004115700721740723, -0.0038149356842041016, -0.0035141706466674805, -0.0032134056091308594, -0.0029126405715942383, -0.002611875534057617, -0.002311110496520996, -0.002010345458984375, -0.001709580421447754, -0.0014088153839111328, -0.0011080503463745117, -0.0008072853088378906, -0.0005065202713012695, -0.00020575523376464844, 9.500980377197266e-05, 0.00039577484130859375, 0.0006965398788452148, 0.000997304916381836, 0.001298069953918457, 0.0015988349914550781, 0.0018996000289916992, 0.0022003650665283203, 0.0025011301040649414, 0.0028018951416015625, 0.0031026601791381836, 0.0034034252166748047, 0.0037041902542114258, 0.004004955291748047, 0.004305720329284668, 0.004606485366821289, 0.00490725040435791, 0.005208015441894531, 0.005508780479431152, 0.0058095455169677734, 0.0061103105545043945, 0.006411075592041016, 0.006711840629577637, 0.007012605667114258, 0.007313370704650879, 0.0076141357421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 11.0, 26.0, 18.0, 33.0, 76.0, 111.0, 197.0, 443.0, 1131.0, 3418.0, 16240.0, 221641.0, 757917.0, 38268.0, 6009.0, 1660.0, 695.0, 266.0, 157.0, 87.0, 52.0, 30.0, 25.0, 15.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.40625, -53.7861328125, -52.166015625, -50.5458984375, -48.92578125, -47.3056640625, -45.685546875, -44.0654296875, -42.4453125, -40.8251953125, -39.205078125, -37.5849609375, -35.96484375, -34.3447265625, -32.724609375, -31.1044921875, -29.484375, -27.8642578125, -26.244140625, -24.6240234375, -23.00390625, -21.3837890625, -19.763671875, -18.1435546875, -16.5234375, -14.9033203125, -13.283203125, -11.6630859375, -10.04296875, -8.4228515625, -6.802734375, -5.1826171875, -3.5625, -1.9423828125, -0.322265625, 1.2978515625, 2.91796875, 4.5380859375, 6.158203125, 7.7783203125, 9.3984375, 11.0185546875, 12.638671875, 14.2587890625, 15.87890625, 17.4990234375, 19.119140625, 20.7392578125, 22.359375, 23.9794921875, 25.599609375, 27.2197265625, 28.83984375, 30.4599609375, 32.080078125, 33.7001953125, 35.3203125, 36.9404296875, 38.560546875, 40.1806640625, 41.80078125, 43.4208984375, 45.041015625, 46.6611328125, 48.28125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 5.0, 9.0, 7.0, 8.0, 12.0, 19.0, 29.0, 22.0, 36.0, 40.0, 62.0, 49.0, 92.0, 100.0, 97.0, 77.0, 69.0, 67.0, 38.0, 29.0, 28.0, 20.0, 22.0, 12.0, 16.0, 7.0, 6.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.109375, -23.212158203125, -22.31494140625, -21.417724609375, -20.5205078125, -19.623291015625, -18.72607421875, -17.828857421875, -16.931640625, -16.034423828125, -15.13720703125, -14.239990234375, -13.3427734375, -12.445556640625, -11.54833984375, -10.651123046875, -9.75390625, -8.856689453125, -7.95947265625, -7.062255859375, -6.1650390625, -5.267822265625, -4.37060546875, -3.473388671875, -2.576171875, -1.678955078125, -0.78173828125, 0.115478515625, 1.0126953125, 1.909912109375, 2.80712890625, 3.704345703125, 4.6015625, 5.498779296875, 6.39599609375, 7.293212890625, 8.1904296875, 9.087646484375, 9.98486328125, 10.882080078125, 11.779296875, 12.676513671875, 13.57373046875, 14.470947265625, 15.3681640625, 16.265380859375, 17.16259765625, 18.059814453125, 18.95703125, 19.854248046875, 20.75146484375, 21.648681640625, 22.5458984375, 23.443115234375, 24.34033203125, 25.237548828125, 26.134765625, 27.031982421875, 27.92919921875, 28.826416015625, 29.7236328125, 30.620849609375, 31.51806640625, 32.415283203125, 33.3125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 4.0, 10.0, 25.0, 37.0, 78.0, 103.0, 133.0, 192.0, 136.0, 116.0, 62.0, 37.0, 19.0, 9.0, 7.0, 7.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-581.22021484375, -565.3141479492188, -549.4081420898438, -533.5020751953125, -517.5960083007812, -501.6899719238281, -485.783935546875, -469.87786865234375, -453.9718322753906, -438.0657958984375, -422.15972900390625, -406.2536926269531, -390.34765625, -374.44158935546875, -358.5355529785156, -342.6295166015625, -326.72344970703125, -310.8174133300781, -294.9113464355469, -279.00531005859375, -263.0992431640625, -247.19320678710938, -231.28717041015625, -215.38111877441406, -199.47506713867188, -183.5690155029297, -167.6629638671875, -151.75692749023438, -135.8508758544922, -119.94482421875, -104.03878021240234, -88.13273620605469, -72.22665405273438, -56.32060623168945, -40.41455841064453, -24.50851058959961, -8.602462768554688, 7.3035888671875, 23.209632873535156, 39.11567687988281, 55.021728515625, 70.92778015136719, 86.83382415771484, 102.7398681640625, 118.64591979980469, 134.55197143554688, 150.4580078125, 166.3640594482422, 182.27011108398438, 198.17616271972656, 214.08221435546875, 229.98825073242188, 245.89430236816406, 261.80035400390625, 277.7063903808594, 293.6124267578125, 309.51849365234375, 325.4245300292969, 341.3305969238281, 357.23663330078125, 373.1427001953125, 389.0487365722656, 404.95477294921875, 420.86083984375, 436.7668762207031]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 5.0, 12.0, 19.0, 32.0, 23.0, 38.0, 41.0, 63.0, 58.0, 81.0, 97.0, 111.0, 86.0, 75.0, 57.0, 55.0, 36.0, 33.0, 26.0, 16.0, 12.0, 9.0, 5.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.8760986328125, -330.5126037597656, -312.14910888671875, -293.78558349609375, -275.4220886230469, -257.05859375, -238.69508361816406, -220.33157348632812, -201.96807861328125, -183.60458374023438, -165.24107360839844, -146.8775634765625, -128.51406860351562, -110.15056610107422, -91.78706359863281, -73.42355346679688, -55.06005859375, -36.696556091308594, -18.333053588867188, 0.03044891357421875, 18.393951416015625, 36.75745391845703, 55.12095642089844, 73.48446655273438, 91.84796142578125, 110.21146392822266, 128.57496643066406, 146.9384765625, 165.30197143554688, 183.66546630859375, 202.0289764404297, 220.39248657226562, 238.7559814453125, 257.1194763183594, 275.48297119140625, 293.84649658203125, 312.2099914550781, 330.573486328125, 348.93701171875, 367.3005065917969, 385.66400146484375, 404.0274963378906, 422.3909912109375, 440.7545166015625, 459.1180114746094, 477.48150634765625, 495.84503173828125, 514.20849609375, 532.572021484375, 550.935546875, 569.2990112304688, 587.6625366210938, 606.0260009765625, 624.3895263671875, 642.7530517578125, 661.1165771484375, 679.4800415039062, 697.8435668945312, 716.20703125, 734.570556640625, 752.93408203125, 771.2975463867188, 789.6610717773438, 808.0245361328125, 826.3880615234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 11.0, 15.0, 22.0, 39.0, 42.0, 79.0, 114.0, 142.0, 218.0, 346.0, 586.0, 1021.0, 1730.0, 3235.0, 6401.0, 13707.0, 35138.0, 119550.0, 690551.0, 2489723.0, 658181.0, 115674.0, 33125.0, 12710.0, 5489.0, 2751.0, 1391.0, 840.0, 476.0, 319.0, 192.0, 123.0, 99.0, 70.0, 37.0, 28.0, 27.0, 16.0, 11.0, 7.0, 12.0, 4.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.609375, -24.710205078125, -23.81103515625, -22.911865234375, -22.0126953125, -21.113525390625, -20.21435546875, -19.315185546875, -18.416015625, -17.516845703125, -16.61767578125, -15.718505859375, -14.8193359375, -13.920166015625, -13.02099609375, -12.121826171875, -11.22265625, -10.323486328125, -9.42431640625, -8.525146484375, -7.6259765625, -6.726806640625, -5.82763671875, -4.928466796875, -4.029296875, -3.130126953125, -2.23095703125, -1.331787109375, -0.4326171875, 0.466552734375, 1.36572265625, 2.264892578125, 3.1640625, 4.063232421875, 4.96240234375, 5.861572265625, 6.7607421875, 7.659912109375, 8.55908203125, 9.458251953125, 10.357421875, 11.256591796875, 12.15576171875, 13.054931640625, 13.9541015625, 14.853271484375, 15.75244140625, 16.651611328125, 17.55078125, 18.449951171875, 19.34912109375, 20.248291015625, 21.1474609375, 22.046630859375, 22.94580078125, 23.844970703125, 24.744140625, 25.643310546875, 26.54248046875, 27.441650390625, 28.3408203125, 29.239990234375, 30.13916015625, 31.038330078125, 31.9375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 16.0, 29.0, 66.0, 63.0, 108.0, 146.0, 166.0, 147.0, 102.0, 70.0, 55.0, 12.0, 8.0, 10.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.5625, -24.9462890625, -23.330078125, -21.7138671875, -20.09765625, -18.4814453125, -16.865234375, -15.2490234375, -13.6328125, -12.0166015625, -10.400390625, -8.7841796875, -7.16796875, -5.5517578125, -3.935546875, -2.3193359375, -0.703125, 0.9130859375, 2.529296875, 4.1455078125, 5.76171875, 7.3779296875, 8.994140625, 10.6103515625, 12.2265625, 13.8427734375, 15.458984375, 17.0751953125, 18.69140625, 20.3076171875, 21.923828125, 23.5400390625, 25.15625, 26.7724609375, 28.388671875, 30.0048828125, 31.62109375, 33.2373046875, 34.853515625, 36.4697265625, 38.0859375, 39.7021484375, 41.318359375, 42.9345703125, 44.55078125, 46.1669921875, 47.783203125, 49.3994140625, 51.015625, 52.6318359375, 54.248046875, 55.8642578125, 57.48046875, 59.0966796875, 60.712890625, 62.3291015625, 63.9453125, 65.5615234375, 67.177734375, 68.7939453125, 70.41015625, 72.0263671875, 73.642578125, 75.2587890625, 76.875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 10.0, 9.0, 16.0, 17.0, 40.0, 79.0, 93.0, 148.0, 276.0, 485.0, 986.0, 2127.0, 5675.0, 19282.0, 104835.0, 2070930.0, 1870441.0, 92691.0, 17025.0, 4920.0, 1994.0, 959.0, 513.0, 291.0, 169.0, 96.0, 51.0, 32.0, 35.0, 14.0, 10.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-70.8125, -68.5986328125, -66.384765625, -64.1708984375, -61.95703125, -59.7431640625, -57.529296875, -55.3154296875, -53.1015625, -50.8876953125, -48.673828125, -46.4599609375, -44.24609375, -42.0322265625, -39.818359375, -37.6044921875, -35.390625, -33.1767578125, -30.962890625, -28.7490234375, -26.53515625, -24.3212890625, -22.107421875, -19.8935546875, -17.6796875, -15.4658203125, -13.251953125, -11.0380859375, -8.82421875, -6.6103515625, -4.396484375, -2.1826171875, 0.03125, 2.2451171875, 4.458984375, 6.6728515625, 8.88671875, 11.1005859375, 13.314453125, 15.5283203125, 17.7421875, 19.9560546875, 22.169921875, 24.3837890625, 26.59765625, 28.8115234375, 31.025390625, 33.2392578125, 35.453125, 37.6669921875, 39.880859375, 42.0947265625, 44.30859375, 46.5224609375, 48.736328125, 50.9501953125, 53.1640625, 55.3779296875, 57.591796875, 59.8056640625, 62.01953125, 64.2333984375, 66.447265625, 68.6611328125, 70.875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 7.0, 4.0, 12.0, 20.0, 22.0, 38.0, 41.0, 51.0, 101.0, 166.0, 245.0, 466.0, 810.0, 886.0, 507.0, 282.0, 141.0, 84.0, 46.0, 38.0, 35.0, 20.0, 12.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.9375, -79.3828125, -76.828125, -74.2734375, -71.71875, -69.1640625, -66.609375, -64.0546875, -61.5, -58.9453125, -56.390625, -53.8359375, -51.28125, -48.7265625, -46.171875, -43.6171875, -41.0625, -38.5078125, -35.953125, -33.3984375, -30.84375, -28.2890625, -25.734375, -23.1796875, -20.625, -18.0703125, -15.515625, -12.9609375, -10.40625, -7.8515625, -5.296875, -2.7421875, -0.1875, 2.3671875, 4.921875, 7.4765625, 10.03125, 12.5859375, 15.140625, 17.6953125, 20.25, 22.8046875, 25.359375, 27.9140625, 30.46875, 33.0234375, 35.578125, 38.1328125, 40.6875, 43.2421875, 45.796875, 48.3515625, 50.90625, 53.4609375, 56.015625, 58.5703125, 61.125, 63.6796875, 66.234375, 68.7890625, 71.34375, 73.8984375, 76.453125, 79.0078125, 81.5625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 6.0, 16.0, 20.0, 62.0, 252.0, 443.0, 152.0, 34.0, 6.0, 9.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2344.88427734375, -2297.390869140625, -2249.8974609375, -2202.40380859375, -2154.910400390625, -2107.4169921875, -2059.923583984375, -2012.4300537109375, -1964.9365234375, -1917.443115234375, -1869.9495849609375, -1822.4561767578125, -1774.962646484375, -1727.46923828125, -1679.9757080078125, -1632.4822998046875, -1584.98876953125, -1537.495361328125, -1490.0018310546875, -1442.5084228515625, -1395.014892578125, -1347.521484375, -1300.0279541015625, -1252.5345458984375, -1205.0411376953125, -1157.5477294921875, -1110.05419921875, -1062.560791015625, -1015.0672607421875, -967.5737915039062, -920.080322265625, -872.5869140625, -825.0933837890625, -777.5999145507812, -730.1064453125, -682.6129760742188, -635.1195068359375, -587.6260375976562, -540.132568359375, -492.6391296386719, -445.1456604003906, -397.6521911621094, -350.1587219238281, -302.665283203125, -255.1717987060547, -207.67832946777344, -160.18487548828125, -112.69140625, -65.19793701171875, -17.704471588134766, 29.78899383544922, 77.28245544433594, 124.77592468261719, 172.26939392089844, 219.76284790039062, 267.2563171386719, 314.7497863769531, 362.2432556152344, 409.7367248535156, 457.23016357421875, 504.7236328125, 552.2171020507812, 599.7105712890625, 647.2040405273438, 694.697509765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 16.0, 10.0, 16.0, 29.0, 35.0, 40.0, 37.0, 68.0, 59.0, 77.0, 62.0, 78.0, 74.0, 83.0, 71.0, 58.0, 44.0, 30.0, 30.0, 23.0, 17.0, 15.0, 9.0, 6.0, 1.0, 7.0, 1.0, 2.0, 4.0], "bins": [-768.7218627929688, -752.0758056640625, -735.4297485351562, -718.78369140625, -702.1376342773438, -685.4915771484375, -668.8455810546875, -652.1995239257812, -635.553466796875, -618.9074096679688, -602.2613525390625, -585.6152954101562, -568.96923828125, -552.3232421875, -535.6771240234375, -519.0311279296875, -502.3850402832031, -485.7389831542969, -469.0929260253906, -452.4468994140625, -435.80084228515625, -419.15478515625, -402.50872802734375, -385.8626708984375, -369.21661376953125, -352.570556640625, -335.92449951171875, -319.2784423828125, -302.6324157714844, -285.9863586425781, -269.3403015136719, -252.69424438476562, -236.04818725585938, -219.40213012695312, -202.75608825683594, -186.1100311279297, -169.4639892578125, -152.81793212890625, -136.171875, -119.52582550048828, -102.87977600097656, -86.23372650146484, -69.58767700195312, -52.941619873046875, -36.295570373535156, -19.649520874023438, -3.0034637451171875, 13.642585754394531, 30.28863525390625, 46.93468475341797, 63.58073806762695, 80.22679138183594, 96.87284088134766, 113.51889038085938, 130.16494750976562, 146.81100463867188, 163.45704650878906, 180.1031036376953, 196.7491455078125, 213.39520263671875, 230.041259765625, 246.6873016357422, 263.3333740234375, 279.9794006347656, 296.6254577636719]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 9.0, 18.0, 22.0, 46.0, 53.0, 75.0, 143.0, 210.0, 329.0, 432.0, 739.0, 1226.0, 1988.0, 3662.0, 6950.0, 13505.0, 27525.0, 61770.0, 157621.0, 397399.0, 223034.0, 80725.0, 35195.0, 16877.0, 8395.0, 4346.0, 2450.0, 1413.0, 843.0, 518.0, 335.0, 216.0, 147.0, 95.0, 77.0, 42.0, 31.0, 18.0, 17.0, 15.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78125, -36.548828125, -35.31640625, -34.083984375, -32.8515625, -31.619140625, -30.38671875, -29.154296875, -27.921875, -26.689453125, -25.45703125, -24.224609375, -22.9921875, -21.759765625, -20.52734375, -19.294921875, -18.0625, -16.830078125, -15.59765625, -14.365234375, -13.1328125, -11.900390625, -10.66796875, -9.435546875, -8.203125, -6.970703125, -5.73828125, -4.505859375, -3.2734375, -2.041015625, -0.80859375, 0.423828125, 1.65625, 2.888671875, 4.12109375, 5.353515625, 6.5859375, 7.818359375, 9.05078125, 10.283203125, 11.515625, 12.748046875, 13.98046875, 15.212890625, 16.4453125, 17.677734375, 18.91015625, 20.142578125, 21.375, 22.607421875, 23.83984375, 25.072265625, 26.3046875, 27.537109375, 28.76953125, 30.001953125, 31.234375, 32.466796875, 33.69921875, 34.931640625, 36.1640625, 37.396484375, 38.62890625, 39.861328125, 41.09375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 7.0, 11.0, 10.0, 13.0, 11.0, 16.0, 21.0, 21.0, 19.0, 32.0, 30.0, 32.0, 38.0, 30.0, 36.0, 40.0, 54.0, 50.0, 53.0, 57.0, 39.0, 46.0, 49.0, 38.0, 37.0, 38.0, 22.0, 21.0, 21.0, 21.0, 11.0, 12.0, 12.0, 5.0, 10.0, 5.0, 7.0, 1.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.40771484375, -18.8154296875, -18.22314453125, -17.630859375, -17.03857421875, -16.4462890625, -15.85400390625, -15.26171875, -14.66943359375, -14.0771484375, -13.48486328125, -12.892578125, -12.30029296875, -11.7080078125, -11.11572265625, -10.5234375, -9.93115234375, -9.3388671875, -8.74658203125, -8.154296875, -7.56201171875, -6.9697265625, -6.37744140625, -5.78515625, -5.19287109375, -4.6005859375, -4.00830078125, -3.416015625, -2.82373046875, -2.2314453125, -1.63916015625, -1.046875, -0.45458984375, 0.1376953125, 0.72998046875, 1.322265625, 1.91455078125, 2.5068359375, 3.09912109375, 3.69140625, 4.28369140625, 4.8759765625, 5.46826171875, 6.060546875, 6.65283203125, 7.2451171875, 7.83740234375, 8.4296875, 9.02197265625, 9.6142578125, 10.20654296875, 10.798828125, 11.39111328125, 11.9833984375, 12.57568359375, 13.16796875, 13.76025390625, 14.3525390625, 14.94482421875, 15.537109375, 16.12939453125, 16.7216796875, 17.31396484375, 17.90625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 7.0, 17.0, 16.0, 26.0, 49.0, 99.0, 156.0, 289.0, 586.0, 1335.0, 4069.0, 21888.0, 820438.0, 184063.0, 10758.0, 2699.0, 1031.0, 430.0, 234.0, 135.0, 83.0, 42.0, 26.0, 29.0, 10.0, 20.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-223.875, -217.95703125, -212.0390625, -206.12109375, -200.203125, -194.28515625, -188.3671875, -182.44921875, -176.53125, -170.61328125, -164.6953125, -158.77734375, -152.859375, -146.94140625, -141.0234375, -135.10546875, -129.1875, -123.26953125, -117.3515625, -111.43359375, -105.515625, -99.59765625, -93.6796875, -87.76171875, -81.84375, -75.92578125, -70.0078125, -64.08984375, -58.171875, -52.25390625, -46.3359375, -40.41796875, -34.5, -28.58203125, -22.6640625, -16.74609375, -10.828125, -4.91015625, 1.0078125, 6.92578125, 12.84375, 18.76171875, 24.6796875, 30.59765625, 36.515625, 42.43359375, 48.3515625, 54.26953125, 60.1875, 66.10546875, 72.0234375, 77.94140625, 83.859375, 89.77734375, 95.6953125, 101.61328125, 107.53125, 113.44921875, 119.3671875, 125.28515625, 131.203125, 137.12109375, 143.0390625, 148.95703125, 154.875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 14.0, 12.0, 14.0, 34.0, 28.0, 30.0, 61.0, 66.0, 67.0, 82.0, 103.0, 88.0, 63.0, 92.0, 68.0, 49.0, 29.0, 22.0, 23.0, 11.0, 13.0, 13.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.125, -111.7109375, -106.296875, -100.8828125, -95.46875, -90.0546875, -84.640625, -79.2265625, -73.8125, -68.3984375, -62.984375, -57.5703125, -52.15625, -46.7421875, -41.328125, -35.9140625, -30.5, -25.0859375, -19.671875, -14.2578125, -8.84375, -3.4296875, 1.984375, 7.3984375, 12.8125, 18.2265625, 23.640625, 29.0546875, 34.46875, 39.8828125, 45.296875, 50.7109375, 56.125, 61.5390625, 66.953125, 72.3671875, 77.78125, 83.1953125, 88.609375, 94.0234375, 99.4375, 104.8515625, 110.265625, 115.6796875, 121.09375, 126.5078125, 131.921875, 137.3359375, 142.75, 148.1640625, 153.578125, 158.9921875, 164.40625, 169.8203125, 175.234375, 180.6484375, 186.0625, 191.4765625, 196.890625, 202.3046875, 207.71875, 213.1328125, 218.546875, 223.9609375, 229.375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 2.0, 9.0, 5.0, 12.0, 20.0, 22.0, 32.0, 34.0, 56.0, 109.0, 171.0, 298.0, 533.0, 1172.0, 2727.0, 7496.0, 28580.0, 156078.0, 707177.0, 111413.0, 21843.0, 6297.0, 2265.0, 1006.0, 506.0, 279.0, 144.0, 77.0, 52.0, 37.0, 25.0, 19.0, 12.0, 8.0, 6.0, 9.0, 7.0, 3.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.984375, -27.998779296875, -27.01318359375, -26.027587890625, -25.0419921875, -24.056396484375, -23.07080078125, -22.085205078125, -21.099609375, -20.114013671875, -19.12841796875, -18.142822265625, -17.1572265625, -16.171630859375, -15.18603515625, -14.200439453125, -13.21484375, -12.229248046875, -11.24365234375, -10.258056640625, -9.2724609375, -8.286865234375, -7.30126953125, -6.315673828125, -5.330078125, -4.344482421875, -3.35888671875, -2.373291015625, -1.3876953125, -0.402099609375, 0.58349609375, 1.569091796875, 2.5546875, 3.540283203125, 4.52587890625, 5.511474609375, 6.4970703125, 7.482666015625, 8.46826171875, 9.453857421875, 10.439453125, 11.425048828125, 12.41064453125, 13.396240234375, 14.3818359375, 15.367431640625, 16.35302734375, 17.338623046875, 18.32421875, 19.309814453125, 20.29541015625, 21.281005859375, 22.2666015625, 23.252197265625, 24.23779296875, 25.223388671875, 26.208984375, 27.194580078125, 28.18017578125, 29.165771484375, 30.1513671875, 31.136962890625, 32.12255859375, 33.108154296875, 34.09375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 8.0, 7.0, 6.0, 15.0, 18.0, 19.0, 23.0, 28.0, 42.0, 40.0, 74.0, 87.0, 142.0, 129.0, 87.0, 57.0, 52.0, 33.0, 23.0, 30.0, 21.0, 17.0, 8.0, 12.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0076446533203125, -0.007371306419372559, -0.007097959518432617, -0.006824612617492676, -0.006551265716552734, -0.006277918815612793, -0.0060045719146728516, -0.00573122501373291, -0.005457878112792969, -0.005184531211853027, -0.004911184310913086, -0.0046378374099731445, -0.004364490509033203, -0.004091143608093262, -0.0038177967071533203, -0.003544449806213379, -0.0032711029052734375, -0.002997756004333496, -0.0027244091033935547, -0.0024510622024536133, -0.002177715301513672, -0.0019043684005737305, -0.001631021499633789, -0.0013576745986938477, -0.0010843276977539062, -0.0008109807968139648, -0.0005376338958740234, -0.00026428699493408203, 9.059906005859375e-06, 0.0002824068069458008, 0.0005557537078857422, 0.0008291006088256836, 0.001102447509765625, 0.0013757944107055664, 0.0016491413116455078, 0.0019224882125854492, 0.0021958351135253906, 0.002469182014465332, 0.0027425289154052734, 0.003015875816345215, 0.0032892227172851562, 0.0035625696182250977, 0.003835916519165039, 0.0041092634201049805, 0.004382610321044922, 0.004655957221984863, 0.004929304122924805, 0.005202651023864746, 0.0054759979248046875, 0.005749344825744629, 0.00602269172668457, 0.006296038627624512, 0.006569385528564453, 0.0068427324295043945, 0.007116079330444336, 0.007389426231384277, 0.007662773132324219, 0.00793612003326416, 0.008209466934204102, 0.008482813835144043, 0.008756160736083984, 0.009029507637023926, 0.009302854537963867, 0.009576201438903809, 0.00984954833984375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 4.0, 5.0, 11.0, 16.0, 28.0, 32.0, 43.0, 72.0, 98.0, 172.0, 334.0, 592.0, 1101.0, 2331.0, 5661.0, 23373.0, 192252.0, 731386.0, 71842.0, 11890.0, 3731.0, 1656.0, 790.0, 457.0, 257.0, 148.0, 105.0, 62.0, 31.0, 26.0, 22.0, 6.0, 7.0, 7.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.5, -38.440673828125, -37.38134765625, -36.322021484375, -35.2626953125, -34.203369140625, -33.14404296875, -32.084716796875, -31.025390625, -29.966064453125, -28.90673828125, -27.847412109375, -26.7880859375, -25.728759765625, -24.66943359375, -23.610107421875, -22.55078125, -21.491455078125, -20.43212890625, -19.372802734375, -18.3134765625, -17.254150390625, -16.19482421875, -15.135498046875, -14.076171875, -13.016845703125, -11.95751953125, -10.898193359375, -9.8388671875, -8.779541015625, -7.72021484375, -6.660888671875, -5.6015625, -4.542236328125, -3.48291015625, -2.423583984375, -1.3642578125, -0.304931640625, 0.75439453125, 1.813720703125, 2.873046875, 3.932373046875, 4.99169921875, 6.051025390625, 7.1103515625, 8.169677734375, 9.22900390625, 10.288330078125, 11.34765625, 12.406982421875, 13.46630859375, 14.525634765625, 15.5849609375, 16.644287109375, 17.70361328125, 18.762939453125, 19.822265625, 20.881591796875, 21.94091796875, 23.000244140625, 24.0595703125, 25.118896484375, 26.17822265625, 27.237548828125, 28.296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 8.0, 17.0, 18.0, 15.0, 26.0, 30.0, 32.0, 30.0, 42.0, 46.0, 60.0, 66.0, 65.0, 82.0, 62.0, 65.0, 67.0, 38.0, 38.0, 26.0, 31.0, 20.0, 23.0, 22.0, 10.0, 5.0, 9.0, 3.0, 3.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.054931640625, -20.25048828125, -19.446044921875, -18.6416015625, -17.837158203125, -17.03271484375, -16.228271484375, -15.423828125, -14.619384765625, -13.81494140625, -13.010498046875, -12.2060546875, -11.401611328125, -10.59716796875, -9.792724609375, -8.98828125, -8.183837890625, -7.37939453125, -6.574951171875, -5.7705078125, -4.966064453125, -4.16162109375, -3.357177734375, -2.552734375, -1.748291015625, -0.94384765625, -0.139404296875, 0.6650390625, 1.469482421875, 2.27392578125, 3.078369140625, 3.8828125, 4.687255859375, 5.49169921875, 6.296142578125, 7.1005859375, 7.905029296875, 8.70947265625, 9.513916015625, 10.318359375, 11.122802734375, 11.92724609375, 12.731689453125, 13.5361328125, 14.340576171875, 15.14501953125, 15.949462890625, 16.75390625, 17.558349609375, 18.36279296875, 19.167236328125, 19.9716796875, 20.776123046875, 21.58056640625, 22.385009765625, 23.189453125, 23.993896484375, 24.79833984375, 25.602783203125, 26.4072265625, 27.211669921875, 28.01611328125, 28.820556640625, 29.625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 19.0, 22.0, 46.0, 91.0, 154.0, 277.0, 192.0, 89.0, 46.0, 26.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1310.2720947265625, -1283.4244384765625, -1256.57666015625, -1229.72900390625, -1202.88134765625, -1176.03369140625, -1149.1859130859375, -1122.3382568359375, -1095.4906005859375, -1068.6429443359375, -1041.795166015625, -1014.947509765625, -988.099853515625, -961.2521362304688, -934.4044799804688, -907.5567626953125, -880.7091064453125, -853.8613891601562, -827.0137329101562, -800.166015625, -773.318359375, -746.4706420898438, -719.6229858398438, -692.7752685546875, -665.9275512695312, -639.079833984375, -612.232177734375, -585.3844604492188, -558.5368041992188, -531.6890869140625, -504.8414306640625, -477.99371337890625, -451.14605712890625, -424.2983703613281, -397.45068359375, -370.6029968261719, -343.75531005859375, -316.9075927734375, -290.0599365234375, -263.21221923828125, -236.3645477294922, -209.51686096191406, -182.66917419433594, -155.82147216796875, -128.97378540039062, -102.1260986328125, -75.27841186523438, -48.43072509765625, -21.583038330078125, 5.264650344848633, 32.11233901977539, 58.96002960205078, 85.8077163696289, 112.65541076660156, 139.5030975341797, 166.3507843017578, 193.19847106933594, 220.04615783691406, 246.8938446044922, 273.7415466308594, 300.5892333984375, 327.4369201660156, 354.28460693359375, 381.1322937011719, 407.97998046875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 12.0, 6.0, 6.0, 10.0, 8.0, 11.0, 9.0, 18.0, 19.0, 23.0, 23.0, 27.0, 27.0, 45.0, 41.0, 38.0, 63.0, 69.0, 71.0, 59.0, 51.0, 52.0, 39.0, 36.0, 22.0, 28.0, 21.0, 10.0, 23.0, 17.0, 15.0, 14.0, 12.0, 13.0, 12.0, 11.0, 11.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-369.5523681640625, -358.8501281738281, -348.14788818359375, -337.4456481933594, -326.743408203125, -316.0411682128906, -305.33892822265625, -294.6366882324219, -283.9344482421875, -273.2322082519531, -262.52996826171875, -251.82772827148438, -241.12548828125, -230.42324829101562, -219.72100830078125, -209.01876831054688, -198.31651306152344, -187.61427307128906, -176.9120330810547, -166.2097930908203, -155.50755310058594, -144.80531311035156, -134.10305786132812, -123.40082550048828, -112.6985855102539, -101.99634552001953, -91.29410552978516, -80.59185791015625, -69.88961791992188, -59.187381744384766, -48.485137939453125, -37.78289794921875, -27.080657958984375, -16.37841796875, -5.676176071166992, 5.026065826416016, 15.72830581665039, 26.430545806884766, 37.132789611816406, 47.83502960205078, 58.537269592285156, 69.23950958251953, 79.9417495727539, 90.64399719238281, 101.34623718261719, 112.04847717285156, 122.75071716308594, 133.4529571533203, 144.1551971435547, 154.85743713378906, 165.55967712402344, 176.2619171142578, 186.9641571044922, 197.66639709472656, 208.36865234375, 219.07089233398438, 229.77313232421875, 240.47537231445312, 251.1776123046875, 261.8798522949219, 272.58209228515625, 283.2843322753906, 293.986572265625, 304.6888122558594, 315.39105224609375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 13.0, 21.0, 27.0, 32.0, 48.0, 88.0, 142.0, 229.0, 439.0, 718.0, 1244.0, 2454.0, 4925.0, 10668.0, 25374.0, 74736.0, 320955.0, 1724673.0, 1609009.0, 297837.0, 73443.0, 25463.0, 10979.0, 5045.0, 2519.0, 1326.0, 761.0, 432.0, 248.0, 137.0, 107.0, 75.0, 37.0, 26.0, 17.0, 13.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.21875, -23.383056640625, -22.54736328125, -21.711669921875, -20.8759765625, -20.040283203125, -19.20458984375, -18.368896484375, -17.533203125, -16.697509765625, -15.86181640625, -15.026123046875, -14.1904296875, -13.354736328125, -12.51904296875, -11.683349609375, -10.84765625, -10.011962890625, -9.17626953125, -8.340576171875, -7.5048828125, -6.669189453125, -5.83349609375, -4.997802734375, -4.162109375, -3.326416015625, -2.49072265625, -1.655029296875, -0.8193359375, 0.016357421875, 0.85205078125, 1.687744140625, 2.5234375, 3.359130859375, 4.19482421875, 5.030517578125, 5.8662109375, 6.701904296875, 7.53759765625, 8.373291015625, 9.208984375, 10.044677734375, 10.88037109375, 11.716064453125, 12.5517578125, 13.387451171875, 14.22314453125, 15.058837890625, 15.89453125, 16.730224609375, 17.56591796875, 18.401611328125, 19.2373046875, 20.072998046875, 20.90869140625, 21.744384765625, 22.580078125, 23.415771484375, 24.25146484375, 25.087158203125, 25.9228515625, 26.758544921875, 27.59423828125, 28.429931640625, 29.265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 12.0, 7.0, 6.0, 10.0, 14.0, 19.0, 29.0, 26.0, 30.0, 42.0, 40.0, 52.0, 52.0, 61.0, 54.0, 70.0, 43.0, 52.0, 56.0, 62.0, 41.0, 35.0, 36.0, 26.0, 35.0, 15.0, 17.0, 21.0, 11.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.15625, -28.43408203125, -27.7119140625, -26.98974609375, -26.267578125, -25.54541015625, -24.8232421875, -24.10107421875, -23.37890625, -22.65673828125, -21.9345703125, -21.21240234375, -20.490234375, -19.76806640625, -19.0458984375, -18.32373046875, -17.6015625, -16.87939453125, -16.1572265625, -15.43505859375, -14.712890625, -13.99072265625, -13.2685546875, -12.54638671875, -11.82421875, -11.10205078125, -10.3798828125, -9.65771484375, -8.935546875, -8.21337890625, -7.4912109375, -6.76904296875, -6.046875, -5.32470703125, -4.6025390625, -3.88037109375, -3.158203125, -2.43603515625, -1.7138671875, -0.99169921875, -0.26953125, 0.45263671875, 1.1748046875, 1.89697265625, 2.619140625, 3.34130859375, 4.0634765625, 4.78564453125, 5.5078125, 6.22998046875, 6.9521484375, 7.67431640625, 8.396484375, 9.11865234375, 9.8408203125, 10.56298828125, 11.28515625, 12.00732421875, 12.7294921875, 13.45166015625, 14.173828125, 14.89599609375, 15.6181640625, 16.34033203125, 17.0625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 5.0, 10.0, 15.0, 22.0, 28.0, 44.0, 55.0, 73.0, 144.0, 195.0, 393.0, 643.0, 1219.0, 2602.0, 6076.0, 18402.0, 77119.0, 687221.0, 3048363.0, 281304.0, 48537.0, 13102.0, 4454.0, 1977.0, 938.0, 508.0, 309.0, 165.0, 118.0, 83.0, 39.0, 32.0, 18.0, 13.0, 14.0, 7.0, 9.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.15625, -56.23876953125, -54.3212890625, -52.40380859375, -50.486328125, -48.56884765625, -46.6513671875, -44.73388671875, -42.81640625, -40.89892578125, -38.9814453125, -37.06396484375, -35.146484375, -33.22900390625, -31.3115234375, -29.39404296875, -27.4765625, -25.55908203125, -23.6416015625, -21.72412109375, -19.806640625, -17.88916015625, -15.9716796875, -14.05419921875, -12.13671875, -10.21923828125, -8.3017578125, -6.38427734375, -4.466796875, -2.54931640625, -0.6318359375, 1.28564453125, 3.203125, 5.12060546875, 7.0380859375, 8.95556640625, 10.873046875, 12.79052734375, 14.7080078125, 16.62548828125, 18.54296875, 20.46044921875, 22.3779296875, 24.29541015625, 26.212890625, 28.13037109375, 30.0478515625, 31.96533203125, 33.8828125, 35.80029296875, 37.7177734375, 39.63525390625, 41.552734375, 43.47021484375, 45.3876953125, 47.30517578125, 49.22265625, 51.14013671875, 53.0576171875, 54.97509765625, 56.892578125, 58.81005859375, 60.7275390625, 62.64501953125, 64.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 6.0, 11.0, 20.0, 27.0, 49.0, 54.0, 101.0, 190.0, 366.0, 704.0, 897.0, 693.0, 383.0, 186.0, 116.0, 87.0, 54.0, 42.0, 21.0, 14.0, 14.0, 6.0, 10.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.375, -88.48046875, -85.5859375, -82.69140625, -79.796875, -76.90234375, -74.0078125, -71.11328125, -68.21875, -65.32421875, -62.4296875, -59.53515625, -56.640625, -53.74609375, -50.8515625, -47.95703125, -45.0625, -42.16796875, -39.2734375, -36.37890625, -33.484375, -30.58984375, -27.6953125, -24.80078125, -21.90625, -19.01171875, -16.1171875, -13.22265625, -10.328125, -7.43359375, -4.5390625, -1.64453125, 1.25, 4.14453125, 7.0390625, 9.93359375, 12.828125, 15.72265625, 18.6171875, 21.51171875, 24.40625, 27.30078125, 30.1953125, 33.08984375, 35.984375, 38.87890625, 41.7734375, 44.66796875, 47.5625, 50.45703125, 53.3515625, 56.24609375, 59.140625, 62.03515625, 64.9296875, 67.82421875, 70.71875, 73.61328125, 76.5078125, 79.40234375, 82.296875, 85.19140625, 88.0859375, 90.98046875, 93.875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 18.0, 82.0, 389.0, 379.0, 95.0, 16.0, 5.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2836.4833984375, -2778.592529296875, -2720.701904296875, -2662.81103515625, -2604.920166015625, -2547.029541015625, -2489.138671875, -2431.247802734375, -2373.357177734375, -2315.46630859375, -2257.57568359375, -2199.684814453125, -2141.7939453125, -2083.9033203125, -2026.012451171875, -1968.1217041015625, -1910.2308349609375, -1852.340087890625, -1794.44921875, -1736.5584716796875, -1678.667724609375, -1620.77685546875, -1562.8861083984375, -1504.995361328125, -1447.1044921875, -1389.2137451171875, -1331.3228759765625, -1273.43212890625, -1215.5413818359375, -1157.650634765625, -1099.759765625, -1041.8690185546875, -983.9781494140625, -926.0873413085938, -868.1965942382812, -810.3057861328125, -752.4150390625, -694.5242309570312, -636.6334228515625, -578.74267578125, -520.8518676757812, -462.9610900878906, -405.0703125, -347.17950439453125, -289.2887268066406, -231.39794921875, -173.50714111328125, -115.61636352539062, -57.7255859375, 0.16519927978515625, 58.05598449707031, 115.94677734375, 173.83755493164062, 231.72833251953125, 289.619140625, 347.5099182128906, 405.40069580078125, 463.2914733886719, 521.1822509765625, 579.0730590820312, 636.9638671875, 694.8546142578125, 752.7454223632812, 810.63623046875, 868.5269775390625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 11.0, 9.0, 17.0, 17.0, 17.0, 29.0, 35.0, 24.0, 43.0, 38.0, 45.0, 51.0, 49.0, 56.0, 61.0, 61.0, 65.0, 52.0, 51.0, 40.0, 32.0, 41.0, 28.0, 21.0, 23.0, 15.0, 15.0, 11.0, 8.0, 10.0, 2.0, 8.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-501.9755859375, -489.1772155761719, -476.3788757324219, -463.58050537109375, -450.78216552734375, -437.9837951660156, -425.1854248046875, -412.3870849609375, -399.5887451171875, -386.7903747558594, -373.9920349121094, -361.19366455078125, -348.39532470703125, -335.5969543457031, -322.798583984375, -310.000244140625, -297.2018737792969, -284.40350341796875, -271.60516357421875, -258.8067932128906, -246.00845336914062, -233.2100830078125, -220.41172790527344, -207.61337280273438, -194.8150177001953, -182.01666259765625, -169.2183074951172, -156.41995239257812, -143.62158203125, -130.8232421875, -118.02487182617188, -105.22651672363281, -92.42816162109375, -79.62980651855469, -66.83145141601562, -54.03308868408203, -41.23473358154297, -28.436378479003906, -15.638015747070312, -2.83966064453125, 9.958694458007812, 22.757051467895508, 35.5554084777832, 48.35376739501953, 61.152122497558594, 73.95047760009766, 86.74884033203125, 99.54719543457031, 112.34555053710938, 125.14390563964844, 137.9422607421875, 150.74063110351562, 163.53897094726562, 176.33734130859375, 189.1356964111328, 201.93405151367188, 214.73240661621094, 227.53076171875, 240.32911682128906, 253.12747192382812, 265.92584228515625, 278.72418212890625, 291.5225524902344, 304.3209228515625, 317.1192626953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 4.0, 10.0, 10.0, 16.0, 26.0, 31.0, 56.0, 67.0, 87.0, 141.0, 201.0, 310.0, 452.0, 708.0, 1110.0, 1916.0, 3214.0, 5941.0, 11975.0, 26634.0, 71570.0, 245060.0, 436232.0, 153206.0, 49025.0, 19795.0, 9087.0, 4660.0, 2642.0, 1579.0, 980.0, 590.0, 405.0, 276.0, 156.0, 122.0, 82.0, 52.0, 33.0, 34.0, 23.0, 17.0, 8.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.375, -36.05517578125, -34.7353515625, -33.41552734375, -32.095703125, -30.77587890625, -29.4560546875, -28.13623046875, -26.81640625, -25.49658203125, -24.1767578125, -22.85693359375, -21.537109375, -20.21728515625, -18.8974609375, -17.57763671875, -16.2578125, -14.93798828125, -13.6181640625, -12.29833984375, -10.978515625, -9.65869140625, -8.3388671875, -7.01904296875, -5.69921875, -4.37939453125, -3.0595703125, -1.73974609375, -0.419921875, 0.89990234375, 2.2197265625, 3.53955078125, 4.859375, 6.17919921875, 7.4990234375, 8.81884765625, 10.138671875, 11.45849609375, 12.7783203125, 14.09814453125, 15.41796875, 16.73779296875, 18.0576171875, 19.37744140625, 20.697265625, 22.01708984375, 23.3369140625, 24.65673828125, 25.9765625, 27.29638671875, 28.6162109375, 29.93603515625, 31.255859375, 32.57568359375, 33.8955078125, 35.21533203125, 36.53515625, 37.85498046875, 39.1748046875, 40.49462890625, 41.814453125, 43.13427734375, 44.4541015625, 45.77392578125, 47.09375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 7.0, 3.0, 3.0, 8.0, 6.0, 13.0, 6.0, 7.0, 9.0, 11.0, 17.0, 17.0, 15.0, 26.0, 26.0, 32.0, 31.0, 33.0, 39.0, 49.0, 29.0, 41.0, 30.0, 39.0, 49.0, 43.0, 39.0, 36.0, 42.0, 33.0, 30.0, 21.0, 28.0, 31.0, 32.0, 20.0, 20.0, 22.0, 14.0, 11.0, 2.0, 7.0, 5.0, 5.0, 3.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.5546875, -17.953125, -17.3515625, -16.75, -16.1484375, -15.546875, -14.9453125, -14.34375, -13.7421875, -13.140625, -12.5390625, -11.9375, -11.3359375, -10.734375, -10.1328125, -9.53125, -8.9296875, -8.328125, -7.7265625, -7.125, -6.5234375, -5.921875, -5.3203125, -4.71875, -4.1171875, -3.515625, -2.9140625, -2.3125, -1.7109375, -1.109375, -0.5078125, 0.09375, 0.6953125, 1.296875, 1.8984375, 2.5, 3.1015625, 3.703125, 4.3046875, 4.90625, 5.5078125, 6.109375, 6.7109375, 7.3125, 7.9140625, 8.515625, 9.1171875, 9.71875, 10.3203125, 10.921875, 11.5234375, 12.125, 12.7265625, 13.328125, 13.9296875, 14.53125, 15.1328125, 15.734375, 16.3359375, 16.9375, 17.5390625, 18.140625, 18.7421875, 19.34375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 10.0, 14.0, 21.0, 36.0, 37.0, 50.0, 77.0, 151.0, 228.0, 423.0, 791.0, 1729.0, 4856.0, 21963.0, 345966.0, 635447.0, 27134.0, 5635.0, 1913.0, 906.0, 471.0, 248.0, 143.0, 89.0, 66.0, 38.0, 28.0, 22.0, 9.0, 6.0, 12.0, 9.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.1875, -104.3310546875, -100.474609375, -96.6181640625, -92.76171875, -88.9052734375, -85.048828125, -81.1923828125, -77.3359375, -73.4794921875, -69.623046875, -65.7666015625, -61.91015625, -58.0537109375, -54.197265625, -50.3408203125, -46.484375, -42.6279296875, -38.771484375, -34.9150390625, -31.05859375, -27.2021484375, -23.345703125, -19.4892578125, -15.6328125, -11.7763671875, -7.919921875, -4.0634765625, -0.20703125, 3.6494140625, 7.505859375, 11.3623046875, 15.21875, 19.0751953125, 22.931640625, 26.7880859375, 30.64453125, 34.5009765625, 38.357421875, 42.2138671875, 46.0703125, 49.9267578125, 53.783203125, 57.6396484375, 61.49609375, 65.3525390625, 69.208984375, 73.0654296875, 76.921875, 80.7783203125, 84.634765625, 88.4912109375, 92.34765625, 96.2041015625, 100.060546875, 103.9169921875, 107.7734375, 111.6298828125, 115.486328125, 119.3427734375, 123.19921875, 127.0556640625, 130.912109375, 134.7685546875, 138.625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 4.0, 5.0, 14.0, 12.0, 19.0, 18.0, 24.0, 34.0, 43.0, 67.0, 64.0, 73.0, 86.0, 78.0, 83.0, 59.0, 48.0, 52.0, 52.0, 54.0, 37.0, 28.0, 18.0, 7.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.9375, -102.3447265625, -97.751953125, -93.1591796875, -88.56640625, -83.9736328125, -79.380859375, -74.7880859375, -70.1953125, -65.6025390625, -61.009765625, -56.4169921875, -51.82421875, -47.2314453125, -42.638671875, -38.0458984375, -33.453125, -28.8603515625, -24.267578125, -19.6748046875, -15.08203125, -10.4892578125, -5.896484375, -1.3037109375, 3.2890625, 7.8818359375, 12.474609375, 17.0673828125, 21.66015625, 26.2529296875, 30.845703125, 35.4384765625, 40.03125, 44.6240234375, 49.216796875, 53.8095703125, 58.40234375, 62.9951171875, 67.587890625, 72.1806640625, 76.7734375, 81.3662109375, 85.958984375, 90.5517578125, 95.14453125, 99.7373046875, 104.330078125, 108.9228515625, 113.515625, 118.1083984375, 122.701171875, 127.2939453125, 131.88671875, 136.4794921875, 141.072265625, 145.6650390625, 150.2578125, 154.8505859375, 159.443359375, 164.0361328125, 168.62890625, 173.2216796875, 177.814453125, 182.4072265625, 187.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 11.0, 21.0, 30.0, 68.0, 130.0, 226.0, 549.0, 1550.0, 5965.0, 33554.0, 408036.0, 553649.0, 35670.0, 6294.0, 1689.0, 577.0, 261.0, 114.0, 64.0, 41.0, 14.0, 11.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.1875, -40.90966796875, -39.6318359375, -38.35400390625, -37.076171875, -35.79833984375, -34.5205078125, -33.24267578125, -31.96484375, -30.68701171875, -29.4091796875, -28.13134765625, -26.853515625, -25.57568359375, -24.2978515625, -23.02001953125, -21.7421875, -20.46435546875, -19.1865234375, -17.90869140625, -16.630859375, -15.35302734375, -14.0751953125, -12.79736328125, -11.51953125, -10.24169921875, -8.9638671875, -7.68603515625, -6.408203125, -5.13037109375, -3.8525390625, -2.57470703125, -1.296875, -0.01904296875, 1.2587890625, 2.53662109375, 3.814453125, 5.09228515625, 6.3701171875, 7.64794921875, 8.92578125, 10.20361328125, 11.4814453125, 12.75927734375, 14.037109375, 15.31494140625, 16.5927734375, 17.87060546875, 19.1484375, 20.42626953125, 21.7041015625, 22.98193359375, 24.259765625, 25.53759765625, 26.8154296875, 28.09326171875, 29.37109375, 30.64892578125, 31.9267578125, 33.20458984375, 34.482421875, 35.76025390625, 37.0380859375, 38.31591796875, 39.59375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 11.0, 10.0, 18.0, 25.0, 30.0, 43.0, 66.0, 106.0, 116.0, 119.0, 114.0, 79.0, 59.0, 42.0, 28.0, 26.0, 19.0, 18.0, 6.0, 10.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0094451904296875, -0.009199023246765137, -0.008952856063842773, -0.00870668888092041, -0.008460521697998047, -0.008214354515075684, -0.00796818733215332, -0.007722020149230957, -0.007475852966308594, -0.0072296857833862305, -0.006983518600463867, -0.006737351417541504, -0.006491184234619141, -0.006245017051696777, -0.005998849868774414, -0.005752682685852051, -0.0055065155029296875, -0.005260348320007324, -0.005014181137084961, -0.004768013954162598, -0.004521846771240234, -0.004275679588317871, -0.004029512405395508, -0.0037833452224731445, -0.0035371780395507812, -0.003291010856628418, -0.0030448436737060547, -0.0027986764907836914, -0.002552509307861328, -0.002306342124938965, -0.0020601749420166016, -0.0018140077590942383, -0.001567840576171875, -0.0013216733932495117, -0.0010755062103271484, -0.0008293390274047852, -0.0005831718444824219, -0.0003370046615600586, -9.083747863769531e-05, 0.00015532970428466797, 0.00040149688720703125, 0.0006476640701293945, 0.0008938312530517578, 0.001139998435974121, 0.0013861656188964844, 0.0016323328018188477, 0.001878499984741211, 0.0021246671676635742, 0.0023708343505859375, 0.0026170015335083008, 0.002863168716430664, 0.0031093358993530273, 0.0033555030822753906, 0.003601670265197754, 0.003847837448120117, 0.0040940046310424805, 0.004340171813964844, 0.004586338996887207, 0.00483250617980957, 0.005078673362731934, 0.005324840545654297, 0.00557100772857666, 0.0058171749114990234, 0.006063342094421387, 0.00630950927734375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 20.0, 25.0, 25.0, 52.0, 74.0, 127.0, 205.0, 348.0, 628.0, 1259.0, 2901.0, 8573.0, 37038.0, 286034.0, 628667.0, 63145.0, 12186.0, 3839.0, 1553.0, 759.0, 421.0, 245.0, 137.0, 99.0, 54.0, 43.0, 20.0, 25.0, 6.0, 9.0, 8.0, 1.0, 7.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.328125, -29.4130859375, -28.498046875, -27.5830078125, -26.66796875, -25.7529296875, -24.837890625, -23.9228515625, -23.0078125, -22.0927734375, -21.177734375, -20.2626953125, -19.34765625, -18.4326171875, -17.517578125, -16.6025390625, -15.6875, -14.7724609375, -13.857421875, -12.9423828125, -12.02734375, -11.1123046875, -10.197265625, -9.2822265625, -8.3671875, -7.4521484375, -6.537109375, -5.6220703125, -4.70703125, -3.7919921875, -2.876953125, -1.9619140625, -1.046875, -0.1318359375, 0.783203125, 1.6982421875, 2.61328125, 3.5283203125, 4.443359375, 5.3583984375, 6.2734375, 7.1884765625, 8.103515625, 9.0185546875, 9.93359375, 10.8486328125, 11.763671875, 12.6787109375, 13.59375, 14.5087890625, 15.423828125, 16.3388671875, 17.25390625, 18.1689453125, 19.083984375, 19.9990234375, 20.9140625, 21.8291015625, 22.744140625, 23.6591796875, 24.57421875, 25.4892578125, 26.404296875, 27.3193359375, 28.234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 1.0, 4.0, 5.0, 13.0, 7.0, 9.0, 11.0, 20.0, 20.0, 28.0, 35.0, 44.0, 51.0, 51.0, 87.0, 70.0, 103.0, 83.0, 66.0, 62.0, 41.0, 38.0, 43.0, 17.0, 15.0, 12.0, 12.0, 8.0, 8.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-22.703125, -21.979736328125, -21.25634765625, -20.532958984375, -19.8095703125, -19.086181640625, -18.36279296875, -17.639404296875, -16.916015625, -16.192626953125, -15.46923828125, -14.745849609375, -14.0224609375, -13.299072265625, -12.57568359375, -11.852294921875, -11.12890625, -10.405517578125, -9.68212890625, -8.958740234375, -8.2353515625, -7.511962890625, -6.78857421875, -6.065185546875, -5.341796875, -4.618408203125, -3.89501953125, -3.171630859375, -2.4482421875, -1.724853515625, -1.00146484375, -0.278076171875, 0.4453125, 1.168701171875, 1.89208984375, 2.615478515625, 3.3388671875, 4.062255859375, 4.78564453125, 5.509033203125, 6.232421875, 6.955810546875, 7.67919921875, 8.402587890625, 9.1259765625, 9.849365234375, 10.57275390625, 11.296142578125, 12.01953125, 12.742919921875, 13.46630859375, 14.189697265625, 14.9130859375, 15.636474609375, 16.35986328125, 17.083251953125, 17.806640625, 18.530029296875, 19.25341796875, 19.976806640625, 20.7001953125, 21.423583984375, 22.14697265625, 22.870361328125, 23.59375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 13.0, 7.0, 18.0, 27.0, 61.0, 97.0, 211.0, 250.0, 143.0, 74.0, 46.0, 14.0, 8.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-489.26275634765625, -468.1206359863281, -446.978515625, -425.83642578125, -404.6943054199219, -383.55218505859375, -362.41009521484375, -341.2679748535156, -320.1258544921875, -298.9837341308594, -277.84161376953125, -256.69952392578125, -235.55740356445312, -214.415283203125, -193.27317810058594, -172.13107299804688, -150.98895263671875, -129.84683227539062, -108.70472717285156, -87.56261444091797, -66.42050170898438, -45.27838897705078, -24.136276245117188, -2.994171142578125, 18.14794921875, 39.290061950683594, 60.43217468261719, 81.57428741455078, 102.71640014648438, 123.85851287841797, 145.00062561035156, 166.14273071289062, 187.2847900390625, 208.42691040039062, 229.5690155029297, 250.71112060546875, 271.8532409667969, 292.995361328125, 314.137451171875, 335.2795715332031, 356.42169189453125, 377.5638122558594, 398.7059326171875, 419.8480224609375, 440.9901428222656, 462.13226318359375, 483.27435302734375, 504.4164733886719, 525.55859375, 546.70068359375, 567.8428344726562, 588.9849243164062, 610.1270751953125, 631.2691650390625, 652.4112548828125, 673.5533447265625, 694.6954956054688, 715.8375854492188, 736.979736328125, 758.121826171875, 779.263916015625, 800.4060668945312, 821.5481567382812, 842.6903076171875, 863.8323974609375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 4.0, 15.0, 9.0, 11.0, 15.0, 19.0, 21.0, 30.0, 32.0, 32.0, 32.0, 45.0, 38.0, 61.0, 73.0, 87.0, 70.0, 63.0, 45.0, 49.0, 47.0, 31.0, 22.0, 27.0, 23.0, 18.0, 17.0, 13.0, 8.0, 8.0, 5.0, 8.0, 5.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-465.87408447265625, -452.03192138671875, -438.1897277832031, -424.3475646972656, -410.50537109375, -396.6632080078125, -382.821044921875, -368.9788513183594, -355.13665771484375, -341.29449462890625, -327.4523010253906, -313.6101379394531, -299.7679443359375, -285.92578125, -272.0836181640625, -258.2414245605469, -244.39926147460938, -230.5570831298828, -216.71490478515625, -202.87274169921875, -189.03054809570312, -175.18838500976562, -161.34620666503906, -147.5040283203125, -133.66184997558594, -119.81967163085938, -105.97749328613281, -92.13532257080078, -78.29314422607422, -64.45096588134766, -50.608795166015625, -36.76661682128906, -22.9244384765625, -9.08226203918457, 4.759914398193359, 18.602088928222656, 32.44426727294922, 46.28644561767578, 60.12861633300781, 73.97079467773438, 87.81297302246094, 101.6551513671875, 115.49732971191406, 129.33950805664062, 143.18167114257812, 157.02386474609375, 170.86602783203125, 184.7082061767578, 198.55038452148438, 212.39256286621094, 226.2347412109375, 240.076904296875, 253.91909790039062, 267.7612609863281, 281.60345458984375, 295.44561767578125, 309.28778076171875, 323.12994384765625, 336.9721374511719, 350.8143005371094, 364.656494140625, 378.4986572265625, 392.3408203125, 406.1830139160156, 420.02520751953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 6.0, 1.0, 8.0, 7.0, 11.0, 33.0, 38.0, 62.0, 78.0, 153.0, 263.0, 410.0, 748.0, 1541.0, 3086.0, 7211.0, 19071.0, 67473.0, 382478.0, 2269677.0, 1215356.0, 166475.0, 37190.0, 12688.0, 5197.0, 2392.0, 1170.0, 622.0, 354.0, 182.0, 118.0, 57.0, 56.0, 21.0, 21.0, 10.0, 6.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.875, -32.901123046875, -31.92724609375, -30.953369140625, -29.9794921875, -29.005615234375, -28.03173828125, -27.057861328125, -26.083984375, -25.110107421875, -24.13623046875, -23.162353515625, -22.1884765625, -21.214599609375, -20.24072265625, -19.266845703125, -18.29296875, -17.319091796875, -16.34521484375, -15.371337890625, -14.3974609375, -13.423583984375, -12.44970703125, -11.475830078125, -10.501953125, -9.528076171875, -8.55419921875, -7.580322265625, -6.6064453125, -5.632568359375, -4.65869140625, -3.684814453125, -2.7109375, -1.737060546875, -0.76318359375, 0.210693359375, 1.1845703125, 2.158447265625, 3.13232421875, 4.106201171875, 5.080078125, 6.053955078125, 7.02783203125, 8.001708984375, 8.9755859375, 9.949462890625, 10.92333984375, 11.897216796875, 12.87109375, 13.844970703125, 14.81884765625, 15.792724609375, 16.7666015625, 17.740478515625, 18.71435546875, 19.688232421875, 20.662109375, 21.635986328125, 22.60986328125, 23.583740234375, 24.5576171875, 25.531494140625, 26.50537109375, 27.479248046875, 28.453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 17.0, 15.0, 15.0, 16.0, 23.0, 26.0, 28.0, 29.0, 44.0, 37.0, 46.0, 41.0, 40.0, 36.0, 51.0, 56.0, 56.0, 37.0, 61.0, 32.0, 36.0, 32.0, 20.0, 30.0, 25.0, 21.0, 21.0, 16.0, 12.0, 7.0, 8.0, 5.0, 4.0, 6.0, 5.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-22.359375, -21.698486328125, -21.03759765625, -20.376708984375, -19.7158203125, -19.054931640625, -18.39404296875, -17.733154296875, -17.072265625, -16.411376953125, -15.75048828125, -15.089599609375, -14.4287109375, -13.767822265625, -13.10693359375, -12.446044921875, -11.78515625, -11.124267578125, -10.46337890625, -9.802490234375, -9.1416015625, -8.480712890625, -7.81982421875, -7.158935546875, -6.498046875, -5.837158203125, -5.17626953125, -4.515380859375, -3.8544921875, -3.193603515625, -2.53271484375, -1.871826171875, -1.2109375, -0.550048828125, 0.11083984375, 0.771728515625, 1.4326171875, 2.093505859375, 2.75439453125, 3.415283203125, 4.076171875, 4.737060546875, 5.39794921875, 6.058837890625, 6.7197265625, 7.380615234375, 8.04150390625, 8.702392578125, 9.36328125, 10.024169921875, 10.68505859375, 11.345947265625, 12.0068359375, 12.667724609375, 13.32861328125, 13.989501953125, 14.650390625, 15.311279296875, 15.97216796875, 16.633056640625, 17.2939453125, 17.954833984375, 18.61572265625, 19.276611328125, 19.9375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 6.0, 9.0, 8.0, 20.0, 26.0, 47.0, 99.0, 138.0, 317.0, 705.0, 2130.0, 7611.0, 36765.0, 449183.0, 3505023.0, 164824.0, 20529.0, 4548.0, 1320.0, 507.0, 200.0, 107.0, 53.0, 28.0, 21.0, 14.0, 9.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.375, -92.8212890625, -90.267578125, -87.7138671875, -85.16015625, -82.6064453125, -80.052734375, -77.4990234375, -74.9453125, -72.3916015625, -69.837890625, -67.2841796875, -64.73046875, -62.1767578125, -59.623046875, -57.0693359375, -54.515625, -51.9619140625, -49.408203125, -46.8544921875, -44.30078125, -41.7470703125, -39.193359375, -36.6396484375, -34.0859375, -31.5322265625, -28.978515625, -26.4248046875, -23.87109375, -21.3173828125, -18.763671875, -16.2099609375, -13.65625, -11.1025390625, -8.548828125, -5.9951171875, -3.44140625, -0.8876953125, 1.666015625, 4.2197265625, 6.7734375, 9.3271484375, 11.880859375, 14.4345703125, 16.98828125, 19.5419921875, 22.095703125, 24.6494140625, 27.203125, 29.7568359375, 32.310546875, 34.8642578125, 37.41796875, 39.9716796875, 42.525390625, 45.0791015625, 47.6328125, 50.1865234375, 52.740234375, 55.2939453125, 57.84765625, 60.4013671875, 62.955078125, 65.5087890625, 68.0625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 1.0, 5.0, 14.0, 13.0, 10.0, 24.0, 24.0, 32.0, 52.0, 99.0, 125.0, 289.0, 537.0, 840.0, 884.0, 496.0, 260.0, 145.0, 72.0, 56.0, 31.0, 21.0, 13.0, 16.0, 8.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-111.875, -109.271484375, -106.66796875, -104.064453125, -101.4609375, -98.857421875, -96.25390625, -93.650390625, -91.046875, -88.443359375, -85.83984375, -83.236328125, -80.6328125, -78.029296875, -75.42578125, -72.822265625, -70.21875, -67.615234375, -65.01171875, -62.408203125, -59.8046875, -57.201171875, -54.59765625, -51.994140625, -49.390625, -46.787109375, -44.18359375, -41.580078125, -38.9765625, -36.373046875, -33.76953125, -31.166015625, -28.5625, -25.958984375, -23.35546875, -20.751953125, -18.1484375, -15.544921875, -12.94140625, -10.337890625, -7.734375, -5.130859375, -2.52734375, 0.076171875, 2.6796875, 5.283203125, 7.88671875, 10.490234375, 13.09375, 15.697265625, 18.30078125, 20.904296875, 23.5078125, 26.111328125, 28.71484375, 31.318359375, 33.921875, 36.525390625, 39.12890625, 41.732421875, 44.3359375, 46.939453125, 49.54296875, 52.146484375, 54.75]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 12.0, 23.0, 86.0, 343.0, 393.0, 104.0, 23.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2430.1484375, -2381.74462890625, -2333.3408203125, -2284.93701171875, -2236.533203125, -2188.12939453125, -2139.7255859375, -2091.32177734375, -2042.9180908203125, -1994.5142822265625, -1946.1104736328125, -1897.7066650390625, -1849.3028564453125, -1800.899169921875, -1752.495361328125, -1704.091552734375, -1655.687744140625, -1607.283935546875, -1558.880126953125, -1510.476318359375, -1462.072509765625, -1413.668701171875, -1365.264892578125, -1316.8612060546875, -1268.457275390625, -1220.053466796875, -1171.649658203125, -1123.245849609375, -1074.842041015625, -1026.438232421875, -978.0344848632812, -929.6307373046875, -881.2269287109375, -832.8231201171875, -784.4193115234375, -736.0155029296875, -687.6117553710938, -639.2079467773438, -590.8041381835938, -542.400390625, -493.9965515136719, -445.5927429199219, -397.18896484375, -348.78515625, -300.38134765625, -251.97756958007812, -203.57376098632812, -155.16998291015625, -106.76617431640625, -58.36237716674805, -9.958580017089844, 38.445220947265625, 86.84901428222656, 135.2528076171875, 183.6566162109375, 232.06039428710938, 280.4642028808594, 328.8680114746094, 377.27178955078125, 425.67559814453125, 474.07940673828125, 522.483154296875, 570.886962890625, 619.290771484375, 667.694580078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 10.0, 6.0, 9.0, 21.0, 14.0, 16.0, 30.0, 24.0, 31.0, 28.0, 29.0, 42.0, 42.0, 42.0, 46.0, 46.0, 56.0, 47.0, 62.0, 53.0, 44.0, 38.0, 31.0, 31.0, 31.0, 25.0, 31.0, 22.0, 13.0, 22.0, 11.0, 6.0, 8.0, 7.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-352.5919494628906, -342.6274719238281, -332.6629638671875, -322.698486328125, -312.7340087890625, -302.76953125, -292.8050231933594, -282.8405456542969, -272.87603759765625, -262.91156005859375, -252.9470672607422, -242.98257446289062, -233.01809692382812, -223.05360412597656, -213.089111328125, -203.1246337890625, -193.16015625, -183.19566345214844, -173.23118591308594, -163.26669311523438, -153.30221557617188, -143.3377227783203, -133.37322998046875, -123.40874481201172, -113.44425964355469, -103.47977447509766, -93.51528930664062, -83.55079650878906, -73.58631134033203, -63.621826171875, -53.6573371887207, -43.692848205566406, -33.728363037109375, -23.76387596130371, -13.799388885498047, -3.834901809692383, 6.129585266113281, 16.094070434570312, 26.05855941772461, 36.023048400878906, 45.98753356933594, 55.95201873779297, 65.91650390625, 75.88099670410156, 85.8454818725586, 95.80996704101562, 105.77445983886719, 115.73894500732422, 125.70343017578125, 135.6679229736328, 145.6324005126953, 155.59689331054688, 165.56137084960938, 175.52586364746094, 185.4903564453125, 195.454833984375, 205.41932678222656, 215.38381958007812, 225.34829711914062, 235.3127899169922, 245.27728271484375, 255.24176025390625, 265.20623779296875, 275.1707458496094, 285.1352233886719]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 5.0, 9.0, 19.0, 25.0, 44.0, 44.0, 64.0, 106.0, 179.0, 261.0, 436.0, 663.0, 1199.0, 2115.0, 4131.0, 10233.0, 36115.0, 182647.0, 538887.0, 209722.0, 40714.0, 11100.0, 4425.0, 2256.0, 1196.0, 733.0, 424.0, 275.0, 153.0, 116.0, 75.0, 53.0, 44.0, 26.0, 22.0, 11.0, 12.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.03125, -45.5859375, -44.140625, -42.6953125, -41.25, -39.8046875, -38.359375, -36.9140625, -35.46875, -34.0234375, -32.578125, -31.1328125, -29.6875, -28.2421875, -26.796875, -25.3515625, -23.90625, -22.4609375, -21.015625, -19.5703125, -18.125, -16.6796875, -15.234375, -13.7890625, -12.34375, -10.8984375, -9.453125, -8.0078125, -6.5625, -5.1171875, -3.671875, -2.2265625, -0.78125, 0.6640625, 2.109375, 3.5546875, 5.0, 6.4453125, 7.890625, 9.3359375, 10.78125, 12.2265625, 13.671875, 15.1171875, 16.5625, 18.0078125, 19.453125, 20.8984375, 22.34375, 23.7890625, 25.234375, 26.6796875, 28.125, 29.5703125, 31.015625, 32.4609375, 33.90625, 35.3515625, 36.796875, 38.2421875, 39.6875, 41.1328125, 42.578125, 44.0234375, 45.46875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 4.0, 1.0, 5.0, 9.0, 16.0, 9.0, 14.0, 17.0, 15.0, 21.0, 29.0, 29.0, 27.0, 28.0, 40.0, 48.0, 50.0, 38.0, 50.0, 41.0, 62.0, 46.0, 39.0, 41.0, 33.0, 37.0, 32.0, 33.0, 25.0, 31.0, 25.0, 21.0, 21.0, 19.0, 12.0, 9.0, 3.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.521484375, -20.80859375, -20.095703125, -19.3828125, -18.669921875, -17.95703125, -17.244140625, -16.53125, -15.818359375, -15.10546875, -14.392578125, -13.6796875, -12.966796875, -12.25390625, -11.541015625, -10.828125, -10.115234375, -9.40234375, -8.689453125, -7.9765625, -7.263671875, -6.55078125, -5.837890625, -5.125, -4.412109375, -3.69921875, -2.986328125, -2.2734375, -1.560546875, -0.84765625, -0.134765625, 0.578125, 1.291015625, 2.00390625, 2.716796875, 3.4296875, 4.142578125, 4.85546875, 5.568359375, 6.28125, 6.994140625, 7.70703125, 8.419921875, 9.1328125, 9.845703125, 10.55859375, 11.271484375, 11.984375, 12.697265625, 13.41015625, 14.123046875, 14.8359375, 15.548828125, 16.26171875, 16.974609375, 17.6875, 18.400390625, 19.11328125, 19.826171875, 20.5390625, 21.251953125, 21.96484375, 22.677734375, 23.390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 10.0, 4.0, 14.0, 18.0, 17.0, 22.0, 25.0, 48.0, 76.0, 118.0, 165.0, 326.0, 596.0, 1221.0, 3247.0, 13120.0, 145716.0, 813531.0, 57733.0, 7971.0, 2363.0, 1000.0, 520.0, 245.0, 160.0, 79.0, 52.0, 45.0, 26.0, 20.0, 12.0, 9.0, 13.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-88.625, -85.884765625, -83.14453125, -80.404296875, -77.6640625, -74.923828125, -72.18359375, -69.443359375, -66.703125, -63.962890625, -61.22265625, -58.482421875, -55.7421875, -53.001953125, -50.26171875, -47.521484375, -44.78125, -42.041015625, -39.30078125, -36.560546875, -33.8203125, -31.080078125, -28.33984375, -25.599609375, -22.859375, -20.119140625, -17.37890625, -14.638671875, -11.8984375, -9.158203125, -6.41796875, -3.677734375, -0.9375, 1.802734375, 4.54296875, 7.283203125, 10.0234375, 12.763671875, 15.50390625, 18.244140625, 20.984375, 23.724609375, 26.46484375, 29.205078125, 31.9453125, 34.685546875, 37.42578125, 40.166015625, 42.90625, 45.646484375, 48.38671875, 51.126953125, 53.8671875, 56.607421875, 59.34765625, 62.087890625, 64.828125, 67.568359375, 70.30859375, 73.048828125, 75.7890625, 78.529296875, 81.26953125, 84.009765625, 86.75]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 10.0, 10.0, 11.0, 13.0, 13.0, 24.0, 23.0, 33.0, 47.0, 54.0, 50.0, 55.0, 73.0, 63.0, 62.0, 90.0, 63.0, 51.0, 50.0, 48.0, 35.0, 28.0, 25.0, 19.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.875, -116.9765625, -113.078125, -109.1796875, -105.28125, -101.3828125, -97.484375, -93.5859375, -89.6875, -85.7890625, -81.890625, -77.9921875, -74.09375, -70.1953125, -66.296875, -62.3984375, -58.5, -54.6015625, -50.703125, -46.8046875, -42.90625, -39.0078125, -35.109375, -31.2109375, -27.3125, -23.4140625, -19.515625, -15.6171875, -11.71875, -7.8203125, -3.921875, -0.0234375, 3.875, 7.7734375, 11.671875, 15.5703125, 19.46875, 23.3671875, 27.265625, 31.1640625, 35.0625, 38.9609375, 42.859375, 46.7578125, 50.65625, 54.5546875, 58.453125, 62.3515625, 66.25, 70.1484375, 74.046875, 77.9453125, 81.84375, 85.7421875, 89.640625, 93.5390625, 97.4375, 101.3359375, 105.234375, 109.1328125, 113.03125, 116.9296875, 120.828125, 124.7265625, 128.625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 9.0, 9.0, 8.0, 21.0, 26.0, 22.0, 51.0, 68.0, 89.0, 142.0, 285.0, 533.0, 1013.0, 2228.0, 5205.0, 15386.0, 63336.0, 503064.0, 371288.0, 61267.0, 15080.0, 5113.0, 2095.0, 1029.0, 477.0, 252.0, 145.0, 91.0, 67.0, 41.0, 25.0, 33.0, 11.0, 11.0, 8.0, 9.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.109375, -23.305419921875, -22.50146484375, -21.697509765625, -20.8935546875, -20.089599609375, -19.28564453125, -18.481689453125, -17.677734375, -16.873779296875, -16.06982421875, -15.265869140625, -14.4619140625, -13.657958984375, -12.85400390625, -12.050048828125, -11.24609375, -10.442138671875, -9.63818359375, -8.834228515625, -8.0302734375, -7.226318359375, -6.42236328125, -5.618408203125, -4.814453125, -4.010498046875, -3.20654296875, -2.402587890625, -1.5986328125, -0.794677734375, 0.00927734375, 0.813232421875, 1.6171875, 2.421142578125, 3.22509765625, 4.029052734375, 4.8330078125, 5.636962890625, 6.44091796875, 7.244873046875, 8.048828125, 8.852783203125, 9.65673828125, 10.460693359375, 11.2646484375, 12.068603515625, 12.87255859375, 13.676513671875, 14.48046875, 15.284423828125, 16.08837890625, 16.892333984375, 17.6962890625, 18.500244140625, 19.30419921875, 20.108154296875, 20.912109375, 21.716064453125, 22.52001953125, 23.323974609375, 24.1279296875, 24.931884765625, 25.73583984375, 26.539794921875, 27.34375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 8.0, 19.0, 24.0, 43.0, 64.0, 79.0, 96.0, 131.0, 91.0, 120.0, 97.0, 58.0, 39.0, 31.0, 30.0, 8.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0085296630859375, -0.00829392671585083, -0.00805819034576416, -0.00782245397567749, -0.00758671760559082, -0.00735098123550415, -0.0071152448654174805, -0.0068795084953308105, -0.006643772125244141, -0.006408035755157471, -0.006172299385070801, -0.005936563014984131, -0.005700826644897461, -0.005465090274810791, -0.005229353904724121, -0.004993617534637451, -0.004757881164550781, -0.004522144794464111, -0.004286408424377441, -0.0040506720542907715, -0.0038149356842041016, -0.0035791993141174316, -0.0033434629440307617, -0.003107726573944092, -0.002871990203857422, -0.002636253833770752, -0.002400517463684082, -0.002164781093597412, -0.0019290447235107422, -0.0016933083534240723, -0.0014575719833374023, -0.0012218356132507324, -0.0009860992431640625, -0.0007503628730773926, -0.0005146265029907227, -0.00027889013290405273, -4.315376281738281e-05, 0.0001925826072692871, 0.00042831897735595703, 0.000664055347442627, 0.0008997917175292969, 0.0011355280876159668, 0.0013712644577026367, 0.0016070008277893066, 0.0018427371978759766, 0.0020784735679626465, 0.0023142099380493164, 0.0025499463081359863, 0.0027856826782226562, 0.003021419048309326, 0.003257155418395996, 0.003492891788482666, 0.003728628158569336, 0.003964364528656006, 0.004200100898742676, 0.004435837268829346, 0.004671573638916016, 0.0049073100090026855, 0.0051430463790893555, 0.005378782749176025, 0.005614519119262695, 0.005850255489349365, 0.006085991859436035, 0.006321728229522705, 0.006557464599609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 13.0, 19.0, 30.0, 62.0, 101.0, 219.0, 570.0, 1749.0, 7511.0, 69053.0, 825966.0, 128366.0, 11275.0, 2328.0, 737.0, 295.0, 122.0, 65.0, 23.0, 26.0, 14.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.296875, -26.853759765625, -25.41064453125, -23.967529296875, -22.5244140625, -21.081298828125, -19.63818359375, -18.195068359375, -16.751953125, -15.308837890625, -13.86572265625, -12.422607421875, -10.9794921875, -9.536376953125, -8.09326171875, -6.650146484375, -5.20703125, -3.763916015625, -2.32080078125, -0.877685546875, 0.5654296875, 2.008544921875, 3.45166015625, 4.894775390625, 6.337890625, 7.781005859375, 9.22412109375, 10.667236328125, 12.1103515625, 13.553466796875, 14.99658203125, 16.439697265625, 17.8828125, 19.325927734375, 20.76904296875, 22.212158203125, 23.6552734375, 25.098388671875, 26.54150390625, 27.984619140625, 29.427734375, 30.870849609375, 32.31396484375, 33.757080078125, 35.2001953125, 36.643310546875, 38.08642578125, 39.529541015625, 40.97265625, 42.415771484375, 43.85888671875, 45.302001953125, 46.7451171875, 48.188232421875, 49.63134765625, 51.074462890625, 52.517578125, 53.960693359375, 55.40380859375, 56.846923828125, 58.2900390625, 59.733154296875, 61.17626953125, 62.619384765625, 64.0625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 11.0, 10.0, 11.0, 15.0, 26.0, 34.0, 48.0, 61.0, 82.0, 67.0, 84.0, 87.0, 99.0, 88.0, 58.0, 61.0, 34.0, 35.0, 25.0, 15.0, 7.0, 7.0, 6.0, 6.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.375, -32.521728515625, -31.66845703125, -30.815185546875, -29.9619140625, -29.108642578125, -28.25537109375, -27.402099609375, -26.548828125, -25.695556640625, -24.84228515625, -23.989013671875, -23.1357421875, -22.282470703125, -21.42919921875, -20.575927734375, -19.72265625, -18.869384765625, -18.01611328125, -17.162841796875, -16.3095703125, -15.456298828125, -14.60302734375, -13.749755859375, -12.896484375, -12.043212890625, -11.18994140625, -10.336669921875, -9.4833984375, -8.630126953125, -7.77685546875, -6.923583984375, -6.0703125, -5.217041015625, -4.36376953125, -3.510498046875, -2.6572265625, -1.803955078125, -0.95068359375, -0.097412109375, 0.755859375, 1.609130859375, 2.46240234375, 3.315673828125, 4.1689453125, 5.022216796875, 5.87548828125, 6.728759765625, 7.58203125, 8.435302734375, 9.28857421875, 10.141845703125, 10.9951171875, 11.848388671875, 12.70166015625, 13.554931640625, 14.408203125, 15.261474609375, 16.11474609375, 16.968017578125, 17.8212890625, 18.674560546875, 19.52783203125, 20.381103515625, 21.234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 16.0, 23.0, 45.0, 49.0, 93.0, 162.0, 227.0, 131.0, 87.0, 61.0, 35.0, 18.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-369.34765625, -355.2655029296875, -341.183349609375, -327.1011962890625, -313.0190734863281, -298.9369201660156, -284.8547668457031, -270.7726135253906, -256.69049072265625, -242.60833740234375, -228.5261993408203, -214.4440460205078, -200.36190795898438, -186.27975463867188, -172.19760131835938, -158.11544799804688, -144.03329467773438, -129.95114135742188, -115.86900329589844, -101.78684997558594, -87.70470428466797, -73.62255859375, -59.5404052734375, -45.45825958251953, -31.376113891601562, -17.29396629333496, -3.2118186950683594, 10.870330810546875, 24.952476501464844, 39.03462219238281, 53.11677551269531, 67.19892120361328, 81.28106689453125, 95.36321258544922, 109.44535827636719, 123.52751159667969, 137.60964965820312, 151.69180297851562, 165.77395629882812, 179.85610961914062, 193.93824768066406, 208.02040100097656, 222.1025390625, 236.1846923828125, 250.266845703125, 264.3489990234375, 278.43115234375, 292.5132751464844, 306.5954284667969, 320.6775817871094, 334.7597351074219, 348.84185791015625, 362.92401123046875, 377.00616455078125, 391.08831787109375, 405.17047119140625, 419.25262451171875, 433.33477783203125, 447.41693115234375, 461.49908447265625, 475.5812072753906, 489.6633605957031, 503.7455139160156, 517.82763671875, 531.9097900390625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 13.0, 13.0, 11.0, 20.0, 18.0, 19.0, 19.0, 26.0, 27.0, 35.0, 29.0, 41.0, 41.0, 57.0, 81.0, 79.0, 73.0, 47.0, 40.0, 37.0, 34.0, 32.0, 17.0, 32.0, 24.0, 16.0, 18.0, 15.0, 10.0, 8.0, 10.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-368.02923583984375, -356.7095031738281, -345.3897705078125, -334.0700378417969, -322.75030517578125, -311.4305725097656, -300.11083984375, -288.79107666015625, -277.47137451171875, -266.1516418457031, -254.8319091796875, -243.51217651367188, -232.19244384765625, -220.87271118164062, -209.55296325683594, -198.2332305908203, -186.91348266601562, -175.59375, -164.27401733398438, -152.95428466796875, -141.63455200195312, -130.3148193359375, -118.99507141113281, -107.67533874511719, -96.35560607910156, -85.03587341308594, -73.71614074707031, -62.396400451660156, -51.07666778564453, -39.756935119628906, -28.43719482421875, -17.117462158203125, -5.7977294921875, 5.522005081176758, 16.841739654541016, 28.161476135253906, 39.48120880126953, 50.800941467285156, 62.12068176269531, 73.44041442871094, 84.76014709472656, 96.07987976074219, 107.39961242675781, 118.71935272216797, 130.03909301757812, 141.35882568359375, 152.67855834960938, 163.998291015625, 175.31802368164062, 186.63775634765625, 197.95748901367188, 209.2772216796875, 220.59695434570312, 231.91668701171875, 243.23643493652344, 254.55616760253906, 265.87591552734375, 277.1956481933594, 288.515380859375, 299.8351135253906, 311.15484619140625, 322.4745788574219, 333.7943115234375, 345.11407470703125, 356.43377685546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 3.0, 7.0, 7.0, 11.0, 13.0, 28.0, 38.0, 33.0, 74.0, 106.0, 182.0, 292.0, 449.0, 745.0, 1306.0, 2417.0, 4594.0, 9979.0, 25450.0, 84306.0, 365370.0, 1644226.0, 1580511.0, 348183.0, 80905.0, 24706.0, 10115.0, 4604.0, 2357.0, 1253.0, 748.0, 467.0, 263.0, 166.0, 132.0, 72.0, 57.0, 29.0, 19.0, 17.0, 9.0, 7.0, 10.0, 7.0, 2.0, 3.0, 2.0], "bins": [-29.359375, -28.606201171875, -27.85302734375, -27.099853515625, -26.3466796875, -25.593505859375, -24.84033203125, -24.087158203125, -23.333984375, -22.580810546875, -21.82763671875, -21.074462890625, -20.3212890625, -19.568115234375, -18.81494140625, -18.061767578125, -17.30859375, -16.555419921875, -15.80224609375, -15.049072265625, -14.2958984375, -13.542724609375, -12.78955078125, -12.036376953125, -11.283203125, -10.530029296875, -9.77685546875, -9.023681640625, -8.2705078125, -7.517333984375, -6.76416015625, -6.010986328125, -5.2578125, -4.504638671875, -3.75146484375, -2.998291015625, -2.2451171875, -1.491943359375, -0.73876953125, 0.014404296875, 0.767578125, 1.520751953125, 2.27392578125, 3.027099609375, 3.7802734375, 4.533447265625, 5.28662109375, 6.039794921875, 6.79296875, 7.546142578125, 8.29931640625, 9.052490234375, 9.8056640625, 10.558837890625, 11.31201171875, 12.065185546875, 12.818359375, 13.571533203125, 14.32470703125, 15.077880859375, 15.8310546875, 16.584228515625, 17.33740234375, 18.090576171875, 18.84375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 8.0, 13.0, 9.0, 17.0, 22.0, 19.0, 29.0, 21.0, 25.0, 33.0, 40.0, 35.0, 34.0, 44.0, 48.0, 45.0, 50.0, 52.0, 37.0, 49.0, 51.0, 37.0, 39.0, 36.0, 41.0, 21.0, 18.0, 24.0, 22.0, 9.0, 10.0, 11.0, 7.0, 7.0, 4.0, 1.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.501953125, -22.75390625, -22.005859375, -21.2578125, -20.509765625, -19.76171875, -19.013671875, -18.265625, -17.517578125, -16.76953125, -16.021484375, -15.2734375, -14.525390625, -13.77734375, -13.029296875, -12.28125, -11.533203125, -10.78515625, -10.037109375, -9.2890625, -8.541015625, -7.79296875, -7.044921875, -6.296875, -5.548828125, -4.80078125, -4.052734375, -3.3046875, -2.556640625, -1.80859375, -1.060546875, -0.3125, 0.435546875, 1.18359375, 1.931640625, 2.6796875, 3.427734375, 4.17578125, 4.923828125, 5.671875, 6.419921875, 7.16796875, 7.916015625, 8.6640625, 9.412109375, 10.16015625, 10.908203125, 11.65625, 12.404296875, 13.15234375, 13.900390625, 14.6484375, 15.396484375, 16.14453125, 16.892578125, 17.640625, 18.388671875, 19.13671875, 19.884765625, 20.6328125, 21.380859375, 22.12890625, 22.876953125, 23.625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 8.0, 5.0, 17.0, 30.0, 53.0, 79.0, 152.0, 312.0, 844.0, 2506.0, 10212.0, 64766.0, 2154953.0, 1885800.0, 60863.0, 9752.0, 2407.0, 781.0, 356.0, 132.0, 90.0, 42.0, 28.0, 29.0, 14.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.875, -61.5078125, -59.140625, -56.7734375, -54.40625, -52.0390625, -49.671875, -47.3046875, -44.9375, -42.5703125, -40.203125, -37.8359375, -35.46875, -33.1015625, -30.734375, -28.3671875, -26.0, -23.6328125, -21.265625, -18.8984375, -16.53125, -14.1640625, -11.796875, -9.4296875, -7.0625, -4.6953125, -2.328125, 0.0390625, 2.40625, 4.7734375, 7.140625, 9.5078125, 11.875, 14.2421875, 16.609375, 18.9765625, 21.34375, 23.7109375, 26.078125, 28.4453125, 30.8125, 33.1796875, 35.546875, 37.9140625, 40.28125, 42.6484375, 45.015625, 47.3828125, 49.75, 52.1171875, 54.484375, 56.8515625, 59.21875, 61.5859375, 63.953125, 66.3203125, 68.6875, 71.0546875, 73.421875, 75.7890625, 78.15625, 80.5234375, 82.890625, 85.2578125, 87.625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 12.0, 6.0, 8.0, 12.0, 25.0, 26.0, 23.0, 41.0, 59.0, 113.0, 148.0, 219.0, 334.0, 491.0, 638.0, 606.0, 393.0, 295.0, 171.0, 141.0, 64.0, 54.0, 39.0, 35.0, 22.0, 17.0, 13.0, 7.0, 8.0, 8.0, 10.0, 5.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-52.78125, -51.21728515625, -49.6533203125, -48.08935546875, -46.525390625, -44.96142578125, -43.3974609375, -41.83349609375, -40.26953125, -38.70556640625, -37.1416015625, -35.57763671875, -34.013671875, -32.44970703125, -30.8857421875, -29.32177734375, -27.7578125, -26.19384765625, -24.6298828125, -23.06591796875, -21.501953125, -19.93798828125, -18.3740234375, -16.81005859375, -15.24609375, -13.68212890625, -12.1181640625, -10.55419921875, -8.990234375, -7.42626953125, -5.8623046875, -4.29833984375, -2.734375, -1.17041015625, 0.3935546875, 1.95751953125, 3.521484375, 5.08544921875, 6.6494140625, 8.21337890625, 9.77734375, 11.34130859375, 12.9052734375, 14.46923828125, 16.033203125, 17.59716796875, 19.1611328125, 20.72509765625, 22.2890625, 23.85302734375, 25.4169921875, 26.98095703125, 28.544921875, 30.10888671875, 31.6728515625, 33.23681640625, 34.80078125, 36.36474609375, 37.9287109375, 39.49267578125, 41.056640625, 42.62060546875, 44.1845703125, 45.74853515625, 47.3125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 14.0, 18.0, 37.0, 94.0, 174.0, 239.0, 212.0, 111.0, 50.0, 22.0, 6.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-671.1571044921875, -649.3225708007812, -627.4880981445312, -605.653564453125, -583.819091796875, -561.9845581054688, -540.1500244140625, -518.3155517578125, -496.4810485839844, -474.64654541015625, -452.8120422363281, -430.9775390625, -409.14300537109375, -387.30853271484375, -365.4739990234375, -343.6394958496094, -321.80499267578125, -299.9704895019531, -278.135986328125, -256.30145263671875, -234.4669647216797, -212.63246154785156, -190.79794311523438, -168.96343994140625, -147.12893676757812, -125.29443359375, -103.45992279052734, -81.62541198730469, -59.79090881347656, -37.95640563964844, -16.12188720703125, 5.712615966796875, 27.54718017578125, 49.38168716430664, 71.21619415283203, 93.05070495605469, 114.88520812988281, 136.71971130371094, 158.55422973632812, 180.38873291015625, 202.22323608398438, 224.0577392578125, 245.89224243164062, 267.72674560546875, 289.561279296875, 311.395751953125, 333.23028564453125, 355.0647888183594, 376.8992919921875, 398.7337951660156, 420.56829833984375, 442.40283203125, 464.2373046875, 486.07183837890625, 507.9063415527344, 529.7408447265625, 551.5753173828125, 573.4098510742188, 595.2443237304688, 617.078857421875, 638.913330078125, 660.7478637695312, 682.5823974609375, 704.4168701171875, 726.2514038085938]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 7.0, 21.0, 12.0, 11.0, 16.0, 23.0, 30.0, 44.0, 28.0, 51.0, 52.0, 64.0, 53.0, 67.0, 62.0, 66.0, 58.0, 55.0, 52.0, 38.0, 28.0, 33.0, 33.0, 22.0, 16.0, 13.0, 9.0, 9.0, 2.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-360.1078796386719, -349.8678283691406, -339.62774658203125, -329.3876953125, -319.1476135253906, -308.9075622558594, -298.66748046875, -288.42742919921875, -278.1873779296875, -267.94732666015625, -257.7072448730469, -247.46717834472656, -237.22711181640625, -226.987060546875, -216.7469940185547, -206.50692749023438, -196.266845703125, -186.0267791748047, -175.78671264648438, -165.54664611816406, -155.30657958984375, -145.0665283203125, -134.8264617919922, -124.58639526367188, -114.34632873535156, -104.10626220703125, -93.86619567871094, -83.62613677978516, -73.38607025146484, -63.14600372314453, -52.905941009521484, -42.66587829589844, -32.42584228515625, -22.18577766418457, -11.94571304321289, -1.705648422241211, 8.534416198730469, 18.77448272705078, 29.014545440673828, 39.254608154296875, 49.49467468261719, 59.7347412109375, 69.97480773925781, 80.2148666381836, 90.4549331665039, 100.69499969482422, 110.93505859375, 121.17512512207031, 131.41519165039062, 141.65525817871094, 151.89532470703125, 162.13539123535156, 172.37545776367188, 182.61550903320312, 192.85557556152344, 203.09564208984375, 213.33570861816406, 223.57577514648438, 233.8158416748047, 244.055908203125, 254.29595947265625, 264.5360412597656, 274.7760925292969, 285.01617431640625, 295.2562255859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 6.0, 15.0, 17.0, 31.0, 57.0, 78.0, 123.0, 220.0, 349.0, 568.0, 1223.0, 2834.0, 7896.0, 29514.0, 180777.0, 636847.0, 150245.0, 25513.0, 7062.0, 2525.0, 1164.0, 584.0, 349.0, 219.0, 102.0, 80.0, 54.0, 34.0, 17.0, 19.0, 11.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.40625, -52.8271484375, -51.248046875, -49.6689453125, -48.08984375, -46.5107421875, -44.931640625, -43.3525390625, -41.7734375, -40.1943359375, -38.615234375, -37.0361328125, -35.45703125, -33.8779296875, -32.298828125, -30.7197265625, -29.140625, -27.5615234375, -25.982421875, -24.4033203125, -22.82421875, -21.2451171875, -19.666015625, -18.0869140625, -16.5078125, -14.9287109375, -13.349609375, -11.7705078125, -10.19140625, -8.6123046875, -7.033203125, -5.4541015625, -3.875, -2.2958984375, -0.716796875, 0.8623046875, 2.44140625, 4.0205078125, 5.599609375, 7.1787109375, 8.7578125, 10.3369140625, 11.916015625, 13.4951171875, 15.07421875, 16.6533203125, 18.232421875, 19.8115234375, 21.390625, 22.9697265625, 24.548828125, 26.1279296875, 27.70703125, 29.2861328125, 30.865234375, 32.4443359375, 34.0234375, 35.6025390625, 37.181640625, 38.7607421875, 40.33984375, 41.9189453125, 43.498046875, 45.0771484375, 46.65625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 6.0, 4.0, 3.0, 4.0, 8.0, 5.0, 8.0, 9.0, 16.0, 13.0, 21.0, 33.0, 21.0, 34.0, 32.0, 47.0, 43.0, 47.0, 62.0, 54.0, 51.0, 55.0, 60.0, 51.0, 46.0, 41.0, 36.0, 30.0, 36.0, 23.0, 21.0, 16.0, 24.0, 11.0, 8.0, 8.0, 7.0, 7.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.8125, -20.92578125, -20.0390625, -19.15234375, -18.265625, -17.37890625, -16.4921875, -15.60546875, -14.71875, -13.83203125, -12.9453125, -12.05859375, -11.171875, -10.28515625, -9.3984375, -8.51171875, -7.625, -6.73828125, -5.8515625, -4.96484375, -4.078125, -3.19140625, -2.3046875, -1.41796875, -0.53125, 0.35546875, 1.2421875, 2.12890625, 3.015625, 3.90234375, 4.7890625, 5.67578125, 6.5625, 7.44921875, 8.3359375, 9.22265625, 10.109375, 10.99609375, 11.8828125, 12.76953125, 13.65625, 14.54296875, 15.4296875, 16.31640625, 17.203125, 18.08984375, 18.9765625, 19.86328125, 20.75, 21.63671875, 22.5234375, 23.41015625, 24.296875, 25.18359375, 26.0703125, 26.95703125, 27.84375, 28.73046875, 29.6171875, 30.50390625, 31.390625, 32.27734375, 33.1640625, 34.05078125, 34.9375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 8.0, 8.0, 7.0, 11.0, 13.0, 19.0, 24.0, 46.0, 61.0, 83.0, 134.0, 168.0, 320.0, 572.0, 1061.0, 2399.0, 6687.0, 29889.0, 288568.0, 657914.0, 45963.0, 8775.0, 2873.0, 1263.0, 627.0, 309.0, 232.0, 148.0, 91.0, 75.0, 45.0, 48.0, 27.0, 17.0, 10.0, 16.0, 7.0, 4.0, 2.0, 2.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.15625, -55.19287109375, -53.2294921875, -51.26611328125, -49.302734375, -47.33935546875, -45.3759765625, -43.41259765625, -41.44921875, -39.48583984375, -37.5224609375, -35.55908203125, -33.595703125, -31.63232421875, -29.6689453125, -27.70556640625, -25.7421875, -23.77880859375, -21.8154296875, -19.85205078125, -17.888671875, -15.92529296875, -13.9619140625, -11.99853515625, -10.03515625, -8.07177734375, -6.1083984375, -4.14501953125, -2.181640625, -0.21826171875, 1.7451171875, 3.70849609375, 5.671875, 7.63525390625, 9.5986328125, 11.56201171875, 13.525390625, 15.48876953125, 17.4521484375, 19.41552734375, 21.37890625, 23.34228515625, 25.3056640625, 27.26904296875, 29.232421875, 31.19580078125, 33.1591796875, 35.12255859375, 37.0859375, 39.04931640625, 41.0126953125, 42.97607421875, 44.939453125, 46.90283203125, 48.8662109375, 50.82958984375, 52.79296875, 54.75634765625, 56.7197265625, 58.68310546875, 60.646484375, 62.60986328125, 64.5732421875, 66.53662109375, 68.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 7.0, 8.0, 10.0, 13.0, 14.0, 14.0, 26.0, 21.0, 24.0, 28.0, 49.0, 49.0, 45.0, 55.0, 54.0, 75.0, 62.0, 43.0, 51.0, 66.0, 47.0, 41.0, 33.0, 24.0, 21.0, 24.0, 15.0, 13.0, 8.0, 7.0, 11.0, 8.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-88.0625, -84.6826171875, -81.302734375, -77.9228515625, -74.54296875, -71.1630859375, -67.783203125, -64.4033203125, -61.0234375, -57.6435546875, -54.263671875, -50.8837890625, -47.50390625, -44.1240234375, -40.744140625, -37.3642578125, -33.984375, -30.6044921875, -27.224609375, -23.8447265625, -20.46484375, -17.0849609375, -13.705078125, -10.3251953125, -6.9453125, -3.5654296875, -0.185546875, 3.1943359375, 6.57421875, 9.9541015625, 13.333984375, 16.7138671875, 20.09375, 23.4736328125, 26.853515625, 30.2333984375, 33.61328125, 36.9931640625, 40.373046875, 43.7529296875, 47.1328125, 50.5126953125, 53.892578125, 57.2724609375, 60.65234375, 64.0322265625, 67.412109375, 70.7919921875, 74.171875, 77.5517578125, 80.931640625, 84.3115234375, 87.69140625, 91.0712890625, 94.451171875, 97.8310546875, 101.2109375, 104.5908203125, 107.970703125, 111.3505859375, 114.73046875, 118.1103515625, 121.490234375, 124.8701171875, 128.25]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 13.0, 11.0, 13.0, 23.0, 35.0, 48.0, 86.0, 123.0, 231.0, 366.0, 615.0, 1133.0, 2409.0, 5205.0, 13236.0, 39480.0, 157701.0, 666415.0, 111812.0, 30015.0, 10869.0, 4329.0, 2050.0, 1009.0, 527.0, 297.0, 170.0, 104.0, 81.0, 45.0, 22.0, 24.0, 18.0, 11.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -18.006591796875, -17.45068359375, -16.894775390625, -16.3388671875, -15.782958984375, -15.22705078125, -14.671142578125, -14.115234375, -13.559326171875, -13.00341796875, -12.447509765625, -11.8916015625, -11.335693359375, -10.77978515625, -10.223876953125, -9.66796875, -9.112060546875, -8.55615234375, -8.000244140625, -7.4443359375, -6.888427734375, -6.33251953125, -5.776611328125, -5.220703125, -4.664794921875, -4.10888671875, -3.552978515625, -2.9970703125, -2.441162109375, -1.88525390625, -1.329345703125, -0.7734375, -0.217529296875, 0.33837890625, 0.894287109375, 1.4501953125, 2.006103515625, 2.56201171875, 3.117919921875, 3.673828125, 4.229736328125, 4.78564453125, 5.341552734375, 5.8974609375, 6.453369140625, 7.00927734375, 7.565185546875, 8.12109375, 8.677001953125, 9.23291015625, 9.788818359375, 10.3447265625, 10.900634765625, 11.45654296875, 12.012451171875, 12.568359375, 13.124267578125, 13.68017578125, 14.236083984375, 14.7919921875, 15.347900390625, 15.90380859375, 16.459716796875, 17.015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 17.0, 14.0, 38.0, 64.0, 82.0, 119.0, 151.0, 143.0, 93.0, 76.0, 56.0, 25.0, 34.0, 11.0, 15.0, 4.0, 12.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0059814453125, -0.005759119987487793, -0.005536794662475586, -0.005314469337463379, -0.005092144012451172, -0.004869818687438965, -0.004647493362426758, -0.004425168037414551, -0.004202842712402344, -0.003980517387390137, -0.0037581920623779297, -0.0035358667373657227, -0.0033135414123535156, -0.0030912160873413086, -0.0028688907623291016, -0.0026465654373168945, -0.0024242401123046875, -0.0022019147872924805, -0.0019795894622802734, -0.0017572641372680664, -0.0015349388122558594, -0.0013126134872436523, -0.0010902881622314453, -0.0008679628372192383, -0.0006456375122070312, -0.0004233121871948242, -0.0002009868621826172, 2.1338462829589844e-05, 0.00024366378784179688, 0.0004659891128540039, 0.0006883144378662109, 0.000910639762878418, 0.001132965087890625, 0.001355290412902832, 0.001577615737915039, 0.001799941062927246, 0.002022266387939453, 0.00224459171295166, 0.002466917037963867, 0.0026892423629760742, 0.0029115676879882812, 0.0031338930130004883, 0.0033562183380126953, 0.0035785436630249023, 0.0038008689880371094, 0.004023194313049316, 0.0042455196380615234, 0.0044678449630737305, 0.0046901702880859375, 0.0049124956130981445, 0.0051348209381103516, 0.005357146263122559, 0.005579471588134766, 0.005801796913146973, 0.00602412223815918, 0.006246447563171387, 0.006468772888183594, 0.006691098213195801, 0.006913423538208008, 0.007135748863220215, 0.007358074188232422, 0.007580399513244629, 0.007802724838256836, 0.008025050163269043, 0.00824737548828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 8.0, 12.0, 16.0, 32.0, 24.0, 61.0, 89.0, 150.0, 254.0, 517.0, 1130.0, 2813.0, 8730.0, 38753.0, 283431.0, 640454.0, 54417.0, 11465.0, 3521.0, 1359.0, 561.0, 282.0, 179.0, 94.0, 57.0, 40.0, 28.0, 23.0, 13.0, 8.0, 10.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.796875, -23.99951171875, -23.2021484375, -22.40478515625, -21.607421875, -20.81005859375, -20.0126953125, -19.21533203125, -18.41796875, -17.62060546875, -16.8232421875, -16.02587890625, -15.228515625, -14.43115234375, -13.6337890625, -12.83642578125, -12.0390625, -11.24169921875, -10.4443359375, -9.64697265625, -8.849609375, -8.05224609375, -7.2548828125, -6.45751953125, -5.66015625, -4.86279296875, -4.0654296875, -3.26806640625, -2.470703125, -1.67333984375, -0.8759765625, -0.07861328125, 0.71875, 1.51611328125, 2.3134765625, 3.11083984375, 3.908203125, 4.70556640625, 5.5029296875, 6.30029296875, 7.09765625, 7.89501953125, 8.6923828125, 9.48974609375, 10.287109375, 11.08447265625, 11.8818359375, 12.67919921875, 13.4765625, 14.27392578125, 15.0712890625, 15.86865234375, 16.666015625, 17.46337890625, 18.2607421875, 19.05810546875, 19.85546875, 20.65283203125, 21.4501953125, 22.24755859375, 23.044921875, 23.84228515625, 24.6396484375, 25.43701171875, 26.234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 4.0, 6.0, 6.0, 13.0, 15.0, 18.0, 43.0, 53.0, 66.0, 103.0, 120.0, 131.0, 135.0, 88.0, 63.0, 53.0, 32.0, 24.0, 6.0, 8.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.22607421875, -18.3271484375, -17.42822265625, -16.529296875, -15.63037109375, -14.7314453125, -13.83251953125, -12.93359375, -12.03466796875, -11.1357421875, -10.23681640625, -9.337890625, -8.43896484375, -7.5400390625, -6.64111328125, -5.7421875, -4.84326171875, -3.9443359375, -3.04541015625, -2.146484375, -1.24755859375, -0.3486328125, 0.55029296875, 1.44921875, 2.34814453125, 3.2470703125, 4.14599609375, 5.044921875, 5.94384765625, 6.8427734375, 7.74169921875, 8.640625, 9.53955078125, 10.4384765625, 11.33740234375, 12.236328125, 13.13525390625, 14.0341796875, 14.93310546875, 15.83203125, 16.73095703125, 17.6298828125, 18.52880859375, 19.427734375, 20.32666015625, 21.2255859375, 22.12451171875, 23.0234375, 23.92236328125, 24.8212890625, 25.72021484375, 26.619140625, 27.51806640625, 28.4169921875, 29.31591796875, 30.21484375, 31.11376953125, 32.0126953125, 32.91162109375, 33.810546875, 34.70947265625, 35.6083984375, 36.50732421875, 37.40625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 17.0, 30.0, 71.0, 115.0, 392.0, 193.0, 97.0, 42.0, 16.0, 11.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-757.6083984375, -736.9835205078125, -716.3585815429688, -695.7337036132812, -675.1087646484375, -654.48388671875, -633.8590087890625, -613.234130859375, -592.6091918945312, -571.9843139648438, -551.359375, -530.7344970703125, -510.1095886230469, -489.48468017578125, -468.85980224609375, -448.2348937988281, -427.6099853515625, -406.9850769042969, -386.36016845703125, -365.73529052734375, -345.1103820800781, -324.4854736328125, -303.860595703125, -283.2356872558594, -262.61077880859375, -241.98587036132812, -221.36097717285156, -200.736083984375, -180.11117553710938, -159.48626708984375, -138.8613739013672, -118.23648071289062, -97.61163330078125, -76.98673248291016, -56.36183166503906, -35.73693084716797, -15.112030029296875, 5.512870788574219, 26.137771606445312, 46.762664794921875, 67.3875732421875, 88.0124740600586, 108.63737487792969, 129.26226806640625, 149.88717651367188, 170.5120849609375, 191.13697814941406, 211.76187133789062, 232.38677978515625, 253.01168823242188, 273.6365966796875, 294.261474609375, 314.8863830566406, 335.51129150390625, 356.13616943359375, 376.7610778808594, 397.385986328125, 418.0108947753906, 438.63580322265625, 459.26068115234375, 479.8855895996094, 500.510498046875, 521.1353759765625, 541.76025390625, 562.3851928710938]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 7.0, 3.0, 5.0, 7.0, 10.0, 12.0, 9.0, 13.0, 16.0, 12.0, 18.0, 16.0, 30.0, 30.0, 32.0, 28.0, 35.0, 55.0, 65.0, 95.0, 100.0, 61.0, 33.0, 30.0, 31.0, 32.0, 31.0, 26.0, 20.0, 21.0, 22.0, 13.0, 9.0, 7.0, 11.0, 6.0, 9.0, 6.0, 9.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-369.95526123046875, -358.2567138671875, -346.5581359863281, -334.8595886230469, -323.1610107421875, -311.46246337890625, -299.763916015625, -288.06536865234375, -276.3667907714844, -264.6682434082031, -252.96966552734375, -241.2711181640625, -229.5725555419922, -217.87399291992188, -206.17544555664062, -194.4768829345703, -182.7783203125, -171.0797576904297, -159.38119506835938, -147.68264770507812, -135.9840850830078, -124.2855224609375, -112.58696746826172, -100.88841247558594, -89.18984985351562, -77.49128723144531, -65.79273223876953, -54.094173431396484, -42.39561462402344, -30.69705581665039, -18.998497009277344, -7.2999420166015625, 4.39862060546875, 16.097179412841797, 27.795738220214844, 39.49429702758789, 51.19285583496094, 62.891414642333984, 74.58997344970703, 86.28852844238281, 97.98709106445312, 109.68565368652344, 121.38420867919922, 133.082763671875, 144.7813262939453, 156.47988891601562, 168.17843627929688, 179.8769989013672, 191.5755615234375, 203.2741241455078, 214.97268676757812, 226.67123413085938, 238.3697967529297, 250.068359375, 261.76690673828125, 273.4654541015625, 285.1640319824219, 296.8625793457031, 308.5611572265625, 320.25970458984375, 331.958251953125, 343.6568298339844, 355.3553771972656, 367.053955078125, 378.75250244140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 11.0, 8.0, 15.0, 20.0, 22.0, 54.0, 70.0, 86.0, 107.0, 197.0, 300.0, 408.0, 744.0, 1280.0, 2338.0, 4668.0, 10641.0, 27352.0, 84758.0, 327629.0, 1313770.0, 1754206.0, 486563.0, 118230.0, 35122.0, 13036.0, 5713.0, 2792.0, 1574.0, 959.0, 519.0, 366.0, 225.0, 164.0, 95.0, 75.0, 42.0, 29.0, 28.0, 19.0, 9.0, 10.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.639404296875, -22.90380859375, -22.168212890625, -21.4326171875, -20.697021484375, -19.96142578125, -19.225830078125, -18.490234375, -17.754638671875, -17.01904296875, -16.283447265625, -15.5478515625, -14.812255859375, -14.07666015625, -13.341064453125, -12.60546875, -11.869873046875, -11.13427734375, -10.398681640625, -9.6630859375, -8.927490234375, -8.19189453125, -7.456298828125, -6.720703125, -5.985107421875, -5.24951171875, -4.513916015625, -3.7783203125, -3.042724609375, -2.30712890625, -1.571533203125, -0.8359375, -0.100341796875, 0.63525390625, 1.370849609375, 2.1064453125, 2.842041015625, 3.57763671875, 4.313232421875, 5.048828125, 5.784423828125, 6.52001953125, 7.255615234375, 7.9912109375, 8.726806640625, 9.46240234375, 10.197998046875, 10.93359375, 11.669189453125, 12.40478515625, 13.140380859375, 13.8759765625, 14.611572265625, 15.34716796875, 16.082763671875, 16.818359375, 17.553955078125, 18.28955078125, 19.025146484375, 19.7607421875, 20.496337890625, 21.23193359375, 21.967529296875, 22.703125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 10.0, 8.0, 12.0, 13.0, 15.0, 24.0, 32.0, 25.0, 34.0, 39.0, 49.0, 39.0, 57.0, 39.0, 38.0, 51.0, 43.0, 49.0, 44.0, 52.0, 54.0, 36.0, 31.0, 18.0, 29.0, 28.0, 28.0, 15.0, 15.0, 24.0, 4.0, 4.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-24.875, -24.06884765625, -23.2626953125, -22.45654296875, -21.650390625, -20.84423828125, -20.0380859375, -19.23193359375, -18.42578125, -17.61962890625, -16.8134765625, -16.00732421875, -15.201171875, -14.39501953125, -13.5888671875, -12.78271484375, -11.9765625, -11.17041015625, -10.3642578125, -9.55810546875, -8.751953125, -7.94580078125, -7.1396484375, -6.33349609375, -5.52734375, -4.72119140625, -3.9150390625, -3.10888671875, -2.302734375, -1.49658203125, -0.6904296875, 0.11572265625, 0.921875, 1.72802734375, 2.5341796875, 3.34033203125, 4.146484375, 4.95263671875, 5.7587890625, 6.56494140625, 7.37109375, 8.17724609375, 8.9833984375, 9.78955078125, 10.595703125, 11.40185546875, 12.2080078125, 13.01416015625, 13.8203125, 14.62646484375, 15.4326171875, 16.23876953125, 17.044921875, 17.85107421875, 18.6572265625, 19.46337890625, 20.26953125, 21.07568359375, 21.8818359375, 22.68798828125, 23.494140625, 24.30029296875, 25.1064453125, 25.91259765625, 26.71875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 16.0, 13.0, 23.0, 27.0, 33.0, 63.0, 114.0, 225.0, 528.0, 1635.0, 5941.0, 35908.0, 817598.0, 3223632.0, 93236.0, 11065.0, 2675.0, 858.0, 308.0, 155.0, 73.0, 45.0, 32.0, 14.0, 14.0, 8.0, 8.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-79.8125, -77.478515625, -75.14453125, -72.810546875, -70.4765625, -68.142578125, -65.80859375, -63.474609375, -61.140625, -58.806640625, -56.47265625, -54.138671875, -51.8046875, -49.470703125, -47.13671875, -44.802734375, -42.46875, -40.134765625, -37.80078125, -35.466796875, -33.1328125, -30.798828125, -28.46484375, -26.130859375, -23.796875, -21.462890625, -19.12890625, -16.794921875, -14.4609375, -12.126953125, -9.79296875, -7.458984375, -5.125, -2.791015625, -0.45703125, 1.876953125, 4.2109375, 6.544921875, 8.87890625, 11.212890625, 13.546875, 15.880859375, 18.21484375, 20.548828125, 22.8828125, 25.216796875, 27.55078125, 29.884765625, 32.21875, 34.552734375, 36.88671875, 39.220703125, 41.5546875, 43.888671875, 46.22265625, 48.556640625, 50.890625, 53.224609375, 55.55859375, 57.892578125, 60.2265625, 62.560546875, 64.89453125, 67.228515625, 69.5625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 7.0, 18.0, 20.0, 32.0, 32.0, 50.0, 64.0, 128.0, 181.0, 262.0, 450.0, 596.0, 663.0, 546.0, 350.0, 201.0, 143.0, 91.0, 74.0, 46.0, 26.0, 26.0, 8.0, 5.0, 5.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-62.0, -60.287109375, -58.57421875, -56.861328125, -55.1484375, -53.435546875, -51.72265625, -50.009765625, -48.296875, -46.583984375, -44.87109375, -43.158203125, -41.4453125, -39.732421875, -38.01953125, -36.306640625, -34.59375, -32.880859375, -31.16796875, -29.455078125, -27.7421875, -26.029296875, -24.31640625, -22.603515625, -20.890625, -19.177734375, -17.46484375, -15.751953125, -14.0390625, -12.326171875, -10.61328125, -8.900390625, -7.1875, -5.474609375, -3.76171875, -2.048828125, -0.3359375, 1.376953125, 3.08984375, 4.802734375, 6.515625, 8.228515625, 9.94140625, 11.654296875, 13.3671875, 15.080078125, 16.79296875, 18.505859375, 20.21875, 21.931640625, 23.64453125, 25.357421875, 27.0703125, 28.783203125, 30.49609375, 32.208984375, 33.921875, 35.634765625, 37.34765625, 39.060546875, 40.7734375, 42.486328125, 44.19921875, 45.912109375, 47.625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 9.0, 11.0, 28.0, 45.0, 145.0, 279.0, 240.0, 146.0, 61.0, 14.0, 17.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-567.9182739257812, -543.019775390625, -518.1212768554688, -493.2228088378906, -468.3243103027344, -443.4258117675781, -418.52734375, -393.62884521484375, -368.7303466796875, -343.83184814453125, -318.933349609375, -294.0348815917969, -269.1363830566406, -244.23788452148438, -219.3394012451172, -194.44091796875, -169.54241943359375, -144.6439208984375, -119.74543762207031, -94.8469467163086, -69.94845581054688, -45.049964904785156, -20.151473999023438, 4.74700927734375, 29.6455078125, 54.54399871826172, 79.44248962402344, 104.34098052978516, 129.23947143554688, 154.13796997070312, 179.0364532470703, 203.9349365234375, 228.83349609375, 253.73199462890625, 278.6304931640625, 303.5289611816406, 328.4274597167969, 353.3259582519531, 378.22442626953125, 403.1229248046875, 428.02142333984375, 452.919921875, 477.81842041015625, 502.7168884277344, 527.6153564453125, 552.5138549804688, 577.412353515625, 602.3108520507812, 627.2093505859375, 652.1078491210938, 677.00634765625, 701.9048461914062, 726.8033447265625, 751.7017822265625, 776.6002807617188, 801.498779296875, 826.3972778320312, 851.2957763671875, 876.1942749023438, 901.0927734375, 925.9912109375, 950.8897094726562, 975.7882080078125, 1000.6867065429688, 1025.585205078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 8.0, 13.0, 11.0, 14.0, 14.0, 23.0, 28.0, 29.0, 39.0, 41.0, 49.0, 65.0, 40.0, 72.0, 63.0, 79.0, 47.0, 46.0, 55.0, 53.0, 35.0, 26.0, 20.0, 21.0, 20.0, 20.0, 12.0, 13.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-333.4386901855469, -324.39263916015625, -315.34661865234375, -306.3005676269531, -297.2545471191406, -288.20849609375, -279.1624755859375, -270.1164245605469, -261.07037353515625, -252.0243377685547, -242.97830200195312, -233.93226623535156, -224.88623046875, -215.84017944335938, -206.7941436767578, -197.74810791015625, -188.70208740234375, -179.6560516357422, -170.61001586914062, -161.56398010253906, -152.5179443359375, -143.47189331054688, -134.4258575439453, -125.37982177734375, -116.33378601074219, -107.28775024414062, -98.24171447753906, -89.19567108154297, -80.1496353149414, -71.10359954833984, -62.057559967041016, -53.01152038574219, -43.96551513671875, -34.91947937011719, -25.87343978881836, -16.827402114868164, -7.781364440917969, 1.2646713256835938, 10.310710906982422, 19.35675048828125, 28.402786254882812, 37.448822021484375, 46.4948616027832, 55.54090118408203, 64.5869369506836, 73.63297271728516, 82.67901611328125, 91.72505187988281, 100.77108764648438, 109.81712341308594, 118.8631591796875, 127.9092025756836, 136.95523071289062, 146.00128173828125, 155.0473175048828, 164.09335327148438, 173.13938903808594, 182.1854248046875, 191.23146057128906, 200.27749633789062, 209.32354736328125, 218.36956787109375, 227.41561889648438, 236.46165466308594, 245.5076904296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 6.0, 17.0, 13.0, 19.0, 46.0, 45.0, 89.0, 96.0, 146.0, 234.0, 352.0, 554.0, 951.0, 1643.0, 2985.0, 5808.0, 12425.0, 28890.0, 76342.0, 235419.0, 415647.0, 167766.0, 56291.0, 21992.0, 9875.0, 4682.0, 2526.0, 1376.0, 831.0, 537.0, 334.0, 211.0, 112.0, 89.0, 56.0, 44.0, 28.0, 20.0, 8.0, 7.0, 14.0, 8.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0], "bins": [-34.59375, -33.615234375, -32.63671875, -31.658203125, -30.6796875, -29.701171875, -28.72265625, -27.744140625, -26.765625, -25.787109375, -24.80859375, -23.830078125, -22.8515625, -21.873046875, -20.89453125, -19.916015625, -18.9375, -17.958984375, -16.98046875, -16.001953125, -15.0234375, -14.044921875, -13.06640625, -12.087890625, -11.109375, -10.130859375, -9.15234375, -8.173828125, -7.1953125, -6.216796875, -5.23828125, -4.259765625, -3.28125, -2.302734375, -1.32421875, -0.345703125, 0.6328125, 1.611328125, 2.58984375, 3.568359375, 4.546875, 5.525390625, 6.50390625, 7.482421875, 8.4609375, 9.439453125, 10.41796875, 11.396484375, 12.375, 13.353515625, 14.33203125, 15.310546875, 16.2890625, 17.267578125, 18.24609375, 19.224609375, 20.203125, 21.181640625, 22.16015625, 23.138671875, 24.1171875, 25.095703125, 26.07421875, 27.052734375, 28.03125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 13.0, 8.0, 11.0, 9.0, 15.0, 15.0, 27.0, 33.0, 31.0, 30.0, 31.0, 31.0, 30.0, 42.0, 51.0, 53.0, 46.0, 65.0, 38.0, 53.0, 41.0, 38.0, 40.0, 27.0, 34.0, 29.0, 25.0, 23.0, 19.0, 18.0, 11.0, 12.0, 5.0, 5.0, 10.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.609375, -24.807373046875, -24.00537109375, -23.203369140625, -22.4013671875, -21.599365234375, -20.79736328125, -19.995361328125, -19.193359375, -18.391357421875, -17.58935546875, -16.787353515625, -15.9853515625, -15.183349609375, -14.38134765625, -13.579345703125, -12.77734375, -11.975341796875, -11.17333984375, -10.371337890625, -9.5693359375, -8.767333984375, -7.96533203125, -7.163330078125, -6.361328125, -5.559326171875, -4.75732421875, -3.955322265625, -3.1533203125, -2.351318359375, -1.54931640625, -0.747314453125, 0.0546875, 0.856689453125, 1.65869140625, 2.460693359375, 3.2626953125, 4.064697265625, 4.86669921875, 5.668701171875, 6.470703125, 7.272705078125, 8.07470703125, 8.876708984375, 9.6787109375, 10.480712890625, 11.28271484375, 12.084716796875, 12.88671875, 13.688720703125, 14.49072265625, 15.292724609375, 16.0947265625, 16.896728515625, 17.69873046875, 18.500732421875, 19.302734375, 20.104736328125, 20.90673828125, 21.708740234375, 22.5107421875, 23.312744140625, 24.11474609375, 24.916748046875, 25.71875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 8.0, 11.0, 11.0, 8.0, 15.0, 21.0, 33.0, 55.0, 65.0, 99.0, 150.0, 247.0, 380.0, 638.0, 1185.0, 2620.0, 7874.0, 32622.0, 244733.0, 685406.0, 54002.0, 11361.0, 3568.0, 1433.0, 757.0, 441.0, 268.0, 154.0, 108.0, 69.0, 56.0, 41.0, 21.0, 29.0, 19.0, 12.0, 8.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-68.8125, -66.90869140625, -65.0048828125, -63.10107421875, -61.197265625, -59.29345703125, -57.3896484375, -55.48583984375, -53.58203125, -51.67822265625, -49.7744140625, -47.87060546875, -45.966796875, -44.06298828125, -42.1591796875, -40.25537109375, -38.3515625, -36.44775390625, -34.5439453125, -32.64013671875, -30.736328125, -28.83251953125, -26.9287109375, -25.02490234375, -23.12109375, -21.21728515625, -19.3134765625, -17.40966796875, -15.505859375, -13.60205078125, -11.6982421875, -9.79443359375, -7.890625, -5.98681640625, -4.0830078125, -2.17919921875, -0.275390625, 1.62841796875, 3.5322265625, 5.43603515625, 7.33984375, 9.24365234375, 11.1474609375, 13.05126953125, 14.955078125, 16.85888671875, 18.7626953125, 20.66650390625, 22.5703125, 24.47412109375, 26.3779296875, 28.28173828125, 30.185546875, 32.08935546875, 33.9931640625, 35.89697265625, 37.80078125, 39.70458984375, 41.6083984375, 43.51220703125, 45.416015625, 47.31982421875, 49.2236328125, 51.12744140625, 53.03125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 9.0, 10.0, 11.0, 8.0, 10.0, 15.0, 20.0, 23.0, 28.0, 31.0, 32.0, 47.0, 66.0, 62.0, 59.0, 51.0, 70.0, 62.0, 54.0, 43.0, 39.0, 52.0, 35.0, 37.0, 23.0, 22.0, 27.0, 11.0, 6.0, 6.0, 5.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.9375, -119.314453125, -115.69140625, -112.068359375, -108.4453125, -104.822265625, -101.19921875, -97.576171875, -93.953125, -90.330078125, -86.70703125, -83.083984375, -79.4609375, -75.837890625, -72.21484375, -68.591796875, -64.96875, -61.345703125, -57.72265625, -54.099609375, -50.4765625, -46.853515625, -43.23046875, -39.607421875, -35.984375, -32.361328125, -28.73828125, -25.115234375, -21.4921875, -17.869140625, -14.24609375, -10.623046875, -7.0, -3.376953125, 0.24609375, 3.869140625, 7.4921875, 11.115234375, 14.73828125, 18.361328125, 21.984375, 25.607421875, 29.23046875, 32.853515625, 36.4765625, 40.099609375, 43.72265625, 47.345703125, 50.96875, 54.591796875, 58.21484375, 61.837890625, 65.4609375, 69.083984375, 72.70703125, 76.330078125, 79.953125, 83.576171875, 87.19921875, 90.822265625, 94.4453125, 98.068359375, 101.69140625, 105.314453125, 108.9375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 13.0, 18.0, 20.0, 17.0, 29.0, 58.0, 77.0, 117.0, 159.0, 253.0, 459.0, 810.0, 1485.0, 3573.0, 8813.0, 25907.0, 98260.0, 663532.0, 180406.0, 41784.0, 13063.0, 5013.0, 2167.0, 996.0, 593.0, 339.0, 196.0, 128.0, 63.0, 63.0, 43.0, 28.0, 20.0, 13.0, 6.0, 5.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.2471923828125, -9.814697265625, -9.3822021484375, -8.94970703125, -8.5172119140625, -8.084716796875, -7.6522216796875, -7.2197265625, -6.7872314453125, -6.354736328125, -5.9222412109375, -5.48974609375, -5.0572509765625, -4.624755859375, -4.1922607421875, -3.759765625, -3.3272705078125, -2.894775390625, -2.4622802734375, -2.02978515625, -1.5972900390625, -1.164794921875, -0.7322998046875, -0.2998046875, 0.1326904296875, 0.565185546875, 0.9976806640625, 1.43017578125, 1.8626708984375, 2.295166015625, 2.7276611328125, 3.16015625, 3.5926513671875, 4.025146484375, 4.4576416015625, 4.89013671875, 5.3226318359375, 5.755126953125, 6.1876220703125, 6.6201171875, 7.0526123046875, 7.485107421875, 7.9176025390625, 8.35009765625, 8.7825927734375, 9.215087890625, 9.6475830078125, 10.080078125, 10.5125732421875, 10.945068359375, 11.3775634765625, 11.81005859375, 12.2425537109375, 12.675048828125, 13.1075439453125, 13.5400390625, 13.9725341796875, 14.405029296875, 14.8375244140625, 15.27001953125, 15.7025146484375, 16.135009765625, 16.5675048828125, 17.0]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 6.0, 15.0, 21.0, 17.0, 39.0, 56.0, 87.0, 104.0, 116.0, 136.0, 98.0, 77.0, 57.0, 39.0, 23.0, 26.0, 14.0, 13.0, 6.0, 6.0, 4.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004940032958984375, -0.004775106906890869, -0.004610180854797363, -0.004445254802703857, -0.0042803287506103516, -0.004115402698516846, -0.00395047664642334, -0.003785550594329834, -0.003620624542236328, -0.0034556984901428223, -0.0032907724380493164, -0.0031258463859558105, -0.0029609203338623047, -0.002795994281768799, -0.002631068229675293, -0.002466142177581787, -0.0023012161254882812, -0.0021362900733947754, -0.0019713640213012695, -0.0018064379692077637, -0.0016415119171142578, -0.001476585865020752, -0.001311659812927246, -0.0011467337608337402, -0.0009818077087402344, -0.0008168816566467285, -0.0006519556045532227, -0.0004870295524597168, -0.00032210350036621094, -0.00015717744827270508, 7.748603820800781e-06, 0.00017267465591430664, 0.0003376007080078125, 0.0005025267601013184, 0.0006674528121948242, 0.0008323788642883301, 0.000997304916381836, 0.0011622309684753418, 0.0013271570205688477, 0.0014920830726623535, 0.0016570091247558594, 0.0018219351768493652, 0.001986861228942871, 0.002151787281036377, 0.002316713333129883, 0.0024816393852233887, 0.0026465654373168945, 0.0028114914894104004, 0.0029764175415039062, 0.003141343593597412, 0.003306269645690918, 0.003471195697784424, 0.0036361217498779297, 0.0038010478019714355, 0.003965973854064941, 0.004130899906158447, 0.004295825958251953, 0.004460752010345459, 0.004625678062438965, 0.004790604114532471, 0.0049555301666259766, 0.005120456218719482, 0.005285382270812988, 0.005450308322906494, 0.005615234375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 17.0, 17.0, 27.0, 48.0, 68.0, 147.0, 263.0, 524.0, 1263.0, 3460.0, 14173.0, 88847.0, 781318.0, 132574.0, 18674.0, 4418.0, 1443.0, 590.0, 307.0, 176.0, 76.0, 44.0, 25.0, 15.0, 14.0, 7.0, 8.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.90625, -25.1982421875, -24.490234375, -23.7822265625, -23.07421875, -22.3662109375, -21.658203125, -20.9501953125, -20.2421875, -19.5341796875, -18.826171875, -18.1181640625, -17.41015625, -16.7021484375, -15.994140625, -15.2861328125, -14.578125, -13.8701171875, -13.162109375, -12.4541015625, -11.74609375, -11.0380859375, -10.330078125, -9.6220703125, -8.9140625, -8.2060546875, -7.498046875, -6.7900390625, -6.08203125, -5.3740234375, -4.666015625, -3.9580078125, -3.25, -2.5419921875, -1.833984375, -1.1259765625, -0.41796875, 0.2900390625, 0.998046875, 1.7060546875, 2.4140625, 3.1220703125, 3.830078125, 4.5380859375, 5.24609375, 5.9541015625, 6.662109375, 7.3701171875, 8.078125, 8.7861328125, 9.494140625, 10.2021484375, 10.91015625, 11.6181640625, 12.326171875, 13.0341796875, 13.7421875, 14.4501953125, 15.158203125, 15.8662109375, 16.57421875, 17.2822265625, 17.990234375, 18.6982421875, 19.40625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 7.0, 7.0, 9.0, 8.0, 6.0, 6.0, 17.0, 13.0, 26.0, 25.0, 38.0, 44.0, 57.0, 70.0, 71.0, 67.0, 68.0, 60.0, 65.0, 63.0, 59.0, 35.0, 31.0, 30.0, 21.0, 13.0, 19.0, 5.0, 9.0, 5.0, 7.0, 4.0, 2.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-15.5, -15.02783203125, -14.5556640625, -14.08349609375, -13.611328125, -13.13916015625, -12.6669921875, -12.19482421875, -11.72265625, -11.25048828125, -10.7783203125, -10.30615234375, -9.833984375, -9.36181640625, -8.8896484375, -8.41748046875, -7.9453125, -7.47314453125, -7.0009765625, -6.52880859375, -6.056640625, -5.58447265625, -5.1123046875, -4.64013671875, -4.16796875, -3.69580078125, -3.2236328125, -2.75146484375, -2.279296875, -1.80712890625, -1.3349609375, -0.86279296875, -0.390625, 0.08154296875, 0.5537109375, 1.02587890625, 1.498046875, 1.97021484375, 2.4423828125, 2.91455078125, 3.38671875, 3.85888671875, 4.3310546875, 4.80322265625, 5.275390625, 5.74755859375, 6.2197265625, 6.69189453125, 7.1640625, 7.63623046875, 8.1083984375, 8.58056640625, 9.052734375, 9.52490234375, 9.9970703125, 10.46923828125, 10.94140625, 11.41357421875, 11.8857421875, 12.35791015625, 12.830078125, 13.30224609375, 13.7744140625, 14.24658203125, 14.71875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 14.0, 38.0, 83.0, 171.0, 403.0, 142.0, 72.0, 38.0, 18.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-531.448974609375, -510.46685791015625, -489.4847412109375, -468.50262451171875, -447.5205078125, -426.53839111328125, -405.5562744140625, -384.57415771484375, -363.592041015625, -342.60992431640625, -321.6278076171875, -300.64569091796875, -279.66357421875, -258.68145751953125, -237.69935607910156, -216.7172393798828, -195.73513793945312, -174.75302124023438, -153.77090454101562, -132.78878784179688, -111.80667877197266, -90.8245620727539, -69.84245300292969, -48.86033630371094, -27.878219604492188, -6.89610481262207, 14.086009979248047, 35.06812286376953, 56.05023956298828, 77.03235626220703, 98.01446533203125, 118.99658203125, 139.97869873046875, 160.9608154296875, 181.94293212890625, 202.925048828125, 223.90716552734375, 244.8892822265625, 265.87139892578125, 286.853515625, 307.83563232421875, 328.8177490234375, 349.79986572265625, 370.781982421875, 391.76409912109375, 412.7462158203125, 433.72833251953125, 454.71044921875, 475.6925354003906, 496.6746520996094, 517.65673828125, 538.6388549804688, 559.6209716796875, 580.6030883789062, 601.585205078125, 622.5673217773438, 643.5494384765625, 664.5315551757812, 685.513671875, 706.4957885742188, 727.4779052734375, 748.4600219726562, 769.442138671875, 790.4242553710938, 811.4063720703125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 6.0, 14.0, 17.0, 23.0, 22.0, 16.0, 21.0, 31.0, 30.0, 31.0, 39.0, 75.0, 114.0, 126.0, 80.0, 37.0, 29.0, 26.0, 32.0, 32.0, 22.0, 28.0, 11.0, 16.0, 17.0, 18.0, 12.0, 5.0, 7.0, 6.0, 4.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.53582763671875, -322.13092041015625, -310.7260437011719, -299.3211364746094, -287.9162292480469, -276.5113525390625, -265.1064453125, -253.7015380859375, -242.29664611816406, -230.89175415039062, -219.48684692382812, -208.0819549560547, -196.67706298828125, -185.27215576171875, -173.8672637939453, -162.46237182617188, -151.05746459960938, -139.65257263183594, -128.24766540527344, -116.8427734375, -105.43787384033203, -94.03297424316406, -82.62808227539062, -71.22318267822266, -59.81828308105469, -48.41338348388672, -37.008487701416016, -25.603591918945312, -14.198692321777344, -2.793792724609375, 8.611099243164062, 20.01599884033203, 31.420928955078125, 42.825828552246094, 54.2307243347168, 65.6356201171875, 77.04051971435547, 88.44541931152344, 99.85031127929688, 111.25521087646484, 122.66011047363281, 134.06500244140625, 145.46990966796875, 156.8748016357422, 168.27969360351562, 179.68460083007812, 191.08949279785156, 202.494384765625, 213.8992919921875, 225.30418395996094, 236.70909118652344, 248.11398315429688, 259.5188903808594, 270.92376708984375, 282.32867431640625, 293.73358154296875, 305.13848876953125, 316.54339599609375, 327.9482727050781, 339.3531799316406, 350.7580871582031, 362.1629638671875, 373.56787109375, 384.9727783203125, 396.3776550292969]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 9.0, 3.0, 6.0, 6.0, 12.0, 13.0, 15.0, 21.0, 43.0, 42.0, 71.0, 109.0, 132.0, 211.0, 324.0, 542.0, 901.0, 1557.0, 2799.0, 5423.0, 11198.0, 25480.0, 67754.0, 213729.0, 723713.0, 1698196.0, 992253.0, 298934.0, 89550.0, 32065.0, 14008.0, 6681.0, 3480.0, 1932.0, 1133.0, 681.0, 441.0, 265.0, 201.0, 101.0, 86.0, 64.0, 34.0, 24.0, 17.0, 11.0, 6.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.8359375, -30.796875, -29.7578125, -28.71875, -27.6796875, -26.640625, -25.6015625, -24.5625, -23.5234375, -22.484375, -21.4453125, -20.40625, -19.3671875, -18.328125, -17.2890625, -16.25, -15.2109375, -14.171875, -13.1328125, -12.09375, -11.0546875, -10.015625, -8.9765625, -7.9375, -6.8984375, -5.859375, -4.8203125, -3.78125, -2.7421875, -1.703125, -0.6640625, 0.375, 1.4140625, 2.453125, 3.4921875, 4.53125, 5.5703125, 6.609375, 7.6484375, 8.6875, 9.7265625, 10.765625, 11.8046875, 12.84375, 13.8828125, 14.921875, 15.9609375, 17.0, 18.0390625, 19.078125, 20.1171875, 21.15625, 22.1953125, 23.234375, 24.2734375, 25.3125, 26.3515625, 27.390625, 28.4296875, 29.46875, 30.5078125, 31.546875, 32.5859375, 33.625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 11.0, 17.0, 15.0, 17.0, 19.0, 20.0, 18.0, 19.0, 41.0, 34.0, 43.0, 36.0, 33.0, 48.0, 43.0, 58.0, 35.0, 48.0, 52.0, 43.0, 35.0, 43.0, 29.0, 36.0, 25.0, 25.0, 35.0, 14.0, 14.0, 16.0, 13.0, 11.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-22.21875, -21.488037109375, -20.75732421875, -20.026611328125, -19.2958984375, -18.565185546875, -17.83447265625, -17.103759765625, -16.373046875, -15.642333984375, -14.91162109375, -14.180908203125, -13.4501953125, -12.719482421875, -11.98876953125, -11.258056640625, -10.52734375, -9.796630859375, -9.06591796875, -8.335205078125, -7.6044921875, -6.873779296875, -6.14306640625, -5.412353515625, -4.681640625, -3.950927734375, -3.22021484375, -2.489501953125, -1.7587890625, -1.028076171875, -0.29736328125, 0.433349609375, 1.1640625, 1.894775390625, 2.62548828125, 3.356201171875, 4.0869140625, 4.817626953125, 5.54833984375, 6.279052734375, 7.009765625, 7.740478515625, 8.47119140625, 9.201904296875, 9.9326171875, 10.663330078125, 11.39404296875, 12.124755859375, 12.85546875, 13.586181640625, 14.31689453125, 15.047607421875, 15.7783203125, 16.509033203125, 17.23974609375, 17.970458984375, 18.701171875, 19.431884765625, 20.16259765625, 20.893310546875, 21.6240234375, 22.354736328125, 23.08544921875, 23.816162109375, 24.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 9.0, 7.0, 10.0, 8.0, 14.0, 35.0, 24.0, 72.0, 75.0, 147.0, 273.0, 555.0, 1291.0, 4425.0, 44818.0, 3850953.0, 278055.0, 9910.0, 2044.0, 710.0, 371.0, 196.0, 110.0, 52.0, 40.0, 25.0, 22.0, 14.0, 10.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.875, -161.44140625, -156.0078125, -150.57421875, -145.140625, -139.70703125, -134.2734375, -128.83984375, -123.40625, -117.97265625, -112.5390625, -107.10546875, -101.671875, -96.23828125, -90.8046875, -85.37109375, -79.9375, -74.50390625, -69.0703125, -63.63671875, -58.203125, -52.76953125, -47.3359375, -41.90234375, -36.46875, -31.03515625, -25.6015625, -20.16796875, -14.734375, -9.30078125, -3.8671875, 1.56640625, 7.0, 12.43359375, 17.8671875, 23.30078125, 28.734375, 34.16796875, 39.6015625, 45.03515625, 50.46875, 55.90234375, 61.3359375, 66.76953125, 72.203125, 77.63671875, 83.0703125, 88.50390625, 93.9375, 99.37109375, 104.8046875, 110.23828125, 115.671875, 121.10546875, 126.5390625, 131.97265625, 137.40625, 142.83984375, 148.2734375, 153.70703125, 159.140625, 164.57421875, 170.0078125, 175.44140625, 180.875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 12.0, 11.0, 9.0, 10.0, 17.0, 26.0, 29.0, 41.0, 56.0, 76.0, 83.0, 127.0, 175.0, 217.0, 273.0, 394.0, 450.0, 491.0, 355.0, 320.0, 187.0, 173.0, 132.0, 108.0, 66.0, 58.0, 26.0, 36.0, 30.0, 23.0, 12.0, 11.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-75.625, -73.4677734375, -71.310546875, -69.1533203125, -66.99609375, -64.8388671875, -62.681640625, -60.5244140625, -58.3671875, -56.2099609375, -54.052734375, -51.8955078125, -49.73828125, -47.5810546875, -45.423828125, -43.2666015625, -41.109375, -38.9521484375, -36.794921875, -34.6376953125, -32.48046875, -30.3232421875, -28.166015625, -26.0087890625, -23.8515625, -21.6943359375, -19.537109375, -17.3798828125, -15.22265625, -13.0654296875, -10.908203125, -8.7509765625, -6.59375, -4.4365234375, -2.279296875, -0.1220703125, 2.03515625, 4.1923828125, 6.349609375, 8.5068359375, 10.6640625, 12.8212890625, 14.978515625, 17.1357421875, 19.29296875, 21.4501953125, 23.607421875, 25.7646484375, 27.921875, 30.0791015625, 32.236328125, 34.3935546875, 36.55078125, 38.7080078125, 40.865234375, 43.0224609375, 45.1796875, 47.3369140625, 49.494140625, 51.6513671875, 53.80859375, 55.9658203125, 58.123046875, 60.2802734375, 62.4375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 18.0, 25.0, 58.0, 73.0, 114.0, 154.0, 155.0, 126.0, 98.0, 54.0, 41.0, 14.0, 13.0, 12.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-676.854736328125, -648.73486328125, -620.614990234375, -592.4951782226562, -564.3753051757812, -536.2554321289062, -508.13555908203125, -480.0157165527344, -451.8958740234375, -423.7760009765625, -395.6561584472656, -367.5362854003906, -339.41644287109375, -311.29656982421875, -283.17669677734375, -255.05685424804688, -226.93698120117188, -198.81712341308594, -170.697265625, -142.577392578125, -114.4575424194336, -86.33767700195312, -58.21781921386719, -30.09796142578125, -1.9781036376953125, 26.141756057739258, 54.26161575317383, 82.38147735595703, 110.50133514404297, 138.62120056152344, 166.74105834960938, 194.8609161376953, 222.98077392578125, 251.1006317138672, 279.2204895019531, 307.3403625488281, 335.460205078125, 363.580078125, 391.699951171875, 419.8197937011719, 447.93963623046875, 476.05950927734375, 504.1793518066406, 532.2991943359375, 560.4190673828125, 588.5389404296875, 616.6588134765625, 644.7786865234375, 672.8985595703125, 701.0184326171875, 729.1383056640625, 757.2581176757812, 785.3779907226562, 813.4978637695312, 841.6177368164062, 869.737548828125, 897.857421875, 925.977294921875, 954.09716796875, 982.2169799804688, 1010.3368530273438, 1038.456787109375, 1066.5765380859375, 1094.6964111328125, 1122.8162841796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 1.0, 0.0, 6.0, 3.0, 3.0, 8.0, 5.0, 14.0, 16.0, 14.0, 22.0, 23.0, 30.0, 31.0, 28.0, 29.0, 43.0, 49.0, 55.0, 45.0, 44.0, 53.0, 56.0, 63.0, 42.0, 34.0, 35.0, 35.0, 28.0, 28.0, 26.0, 12.0, 25.0, 14.0, 26.0, 6.0, 6.0, 9.0, 6.0, 8.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-422.91131591796875, -408.9854431152344, -395.0595703125, -381.13372802734375, -367.2078552246094, -353.281982421875, -339.3561096191406, -325.43023681640625, -311.50439453125, -297.5785217285156, -283.65264892578125, -269.726806640625, -255.80093383789062, -241.87506103515625, -227.94918823242188, -214.0233154296875, -200.09744262695312, -186.17156982421875, -172.24571228027344, -158.31983947753906, -144.39398193359375, -130.46810913085938, -116.542236328125, -102.61637115478516, -88.69050598144531, -74.76464080810547, -60.83877182006836, -46.91290283203125, -32.987037658691406, -19.061172485351562, -5.1352996826171875, 8.790565490722656, 22.7164306640625, 36.642295837402344, 50.56816482543945, 64.49403381347656, 78.4198989868164, 92.34576416015625, 106.27163696289062, 120.19750213623047, 134.1233673095703, 148.0492401123047, 161.97509765625, 175.90097045898438, 189.82684326171875, 203.75270080566406, 217.67857360839844, 231.60443115234375, 245.53030395507812, 259.4561767578125, 273.3820495605469, 287.30792236328125, 301.2337646484375, 315.1596374511719, 329.08551025390625, 343.0113830566406, 356.937255859375, 370.8631286621094, 384.78900146484375, 398.71484375, 412.6407165527344, 426.56658935546875, 440.4924621582031, 454.4183349609375, 468.34417724609375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 9.0, 20.0, 32.0, 38.0, 47.0, 85.0, 132.0, 197.0, 318.0, 511.0, 797.0, 1446.0, 2760.0, 5751.0, 12864.0, 33309.0, 103946.0, 403788.0, 340734.0, 89456.0, 29500.0, 11497.0, 5245.0, 2577.0, 1340.0, 793.0, 514.0, 304.0, 203.0, 101.0, 82.0, 48.0, 23.0, 30.0, 17.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.46875, -35.2900390625, -34.111328125, -32.9326171875, -31.75390625, -30.5751953125, -29.396484375, -28.2177734375, -27.0390625, -25.8603515625, -24.681640625, -23.5029296875, -22.32421875, -21.1455078125, -19.966796875, -18.7880859375, -17.609375, -16.4306640625, -15.251953125, -14.0732421875, -12.89453125, -11.7158203125, -10.537109375, -9.3583984375, -8.1796875, -7.0009765625, -5.822265625, -4.6435546875, -3.46484375, -2.2861328125, -1.107421875, 0.0712890625, 1.25, 2.4287109375, 3.607421875, 4.7861328125, 5.96484375, 7.1435546875, 8.322265625, 9.5009765625, 10.6796875, 11.8583984375, 13.037109375, 14.2158203125, 15.39453125, 16.5732421875, 17.751953125, 18.9306640625, 20.109375, 21.2880859375, 22.466796875, 23.6455078125, 24.82421875, 26.0029296875, 27.181640625, 28.3603515625, 29.5390625, 30.7177734375, 31.896484375, 33.0751953125, 34.25390625, 35.4326171875, 36.611328125, 37.7900390625, 38.96875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 9.0, 8.0, 9.0, 20.0, 22.0, 33.0, 34.0, 42.0, 58.0, 59.0, 65.0, 78.0, 80.0, 93.0, 63.0, 54.0, 34.0, 48.0, 41.0, 26.0, 30.0, 23.0, 10.0, 13.0, 8.0, 13.0, 3.0, 3.0, 8.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.75, -52.09765625, -50.4453125, -48.79296875, -47.140625, -45.48828125, -43.8359375, -42.18359375, -40.53125, -38.87890625, -37.2265625, -35.57421875, -33.921875, -32.26953125, -30.6171875, -28.96484375, -27.3125, -25.66015625, -24.0078125, -22.35546875, -20.703125, -19.05078125, -17.3984375, -15.74609375, -14.09375, -12.44140625, -10.7890625, -9.13671875, -7.484375, -5.83203125, -4.1796875, -2.52734375, -0.875, 0.77734375, 2.4296875, 4.08203125, 5.734375, 7.38671875, 9.0390625, 10.69140625, 12.34375, 13.99609375, 15.6484375, 17.30078125, 18.953125, 20.60546875, 22.2578125, 23.91015625, 25.5625, 27.21484375, 28.8671875, 30.51953125, 32.171875, 33.82421875, 35.4765625, 37.12890625, 38.78125, 40.43359375, 42.0859375, 43.73828125, 45.390625, 47.04296875, 48.6953125, 50.34765625, 52.0]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 10.0, 13.0, 16.0, 14.0, 27.0, 39.0, 60.0, 87.0, 136.0, 231.0, 413.0, 791.0, 1671.0, 4271.0, 16690.0, 115035.0, 821510.0, 68568.0, 12372.0, 3538.0, 1420.0, 634.0, 371.0, 212.0, 125.0, 81.0, 44.0, 35.0, 32.0, 23.0, 16.0, 11.0, 10.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-55.0625, -53.41357421875, -51.7646484375, -50.11572265625, -48.466796875, -46.81787109375, -45.1689453125, -43.52001953125, -41.87109375, -40.22216796875, -38.5732421875, -36.92431640625, -35.275390625, -33.62646484375, -31.9775390625, -30.32861328125, -28.6796875, -27.03076171875, -25.3818359375, -23.73291015625, -22.083984375, -20.43505859375, -18.7861328125, -17.13720703125, -15.48828125, -13.83935546875, -12.1904296875, -10.54150390625, -8.892578125, -7.24365234375, -5.5947265625, -3.94580078125, -2.296875, -0.64794921875, 1.0009765625, 2.64990234375, 4.298828125, 5.94775390625, 7.5966796875, 9.24560546875, 10.89453125, 12.54345703125, 14.1923828125, 15.84130859375, 17.490234375, 19.13916015625, 20.7880859375, 22.43701171875, 24.0859375, 25.73486328125, 27.3837890625, 29.03271484375, 30.681640625, 32.33056640625, 33.9794921875, 35.62841796875, 37.27734375, 38.92626953125, 40.5751953125, 42.22412109375, 43.873046875, 45.52197265625, 47.1708984375, 48.81982421875, 50.46875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 9.0, 10.0, 13.0, 9.0, 12.0, 19.0, 20.0, 29.0, 26.0, 39.0, 63.0, 61.0, 79.0, 80.0, 75.0, 68.0, 66.0, 50.0, 50.0, 34.0, 34.0, 21.0, 17.0, 15.0, 21.0, 13.0, 11.0, 9.0, 17.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.875, -123.970703125, -119.06640625, -114.162109375, -109.2578125, -104.353515625, -99.44921875, -94.544921875, -89.640625, -84.736328125, -79.83203125, -74.927734375, -70.0234375, -65.119140625, -60.21484375, -55.310546875, -50.40625, -45.501953125, -40.59765625, -35.693359375, -30.7890625, -25.884765625, -20.98046875, -16.076171875, -11.171875, -6.267578125, -1.36328125, 3.541015625, 8.4453125, 13.349609375, 18.25390625, 23.158203125, 28.0625, 32.966796875, 37.87109375, 42.775390625, 47.6796875, 52.583984375, 57.48828125, 62.392578125, 67.296875, 72.201171875, 77.10546875, 82.009765625, 86.9140625, 91.818359375, 96.72265625, 101.626953125, 106.53125, 111.435546875, 116.33984375, 121.244140625, 126.1484375, 131.052734375, 135.95703125, 140.861328125, 145.765625, 150.669921875, 155.57421875, 160.478515625, 165.3828125, 170.287109375, 175.19140625, 180.095703125, 185.0]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 10.0, 13.0, 23.0, 22.0, 28.0, 51.0, 63.0, 112.0, 185.0, 282.0, 544.0, 1158.0, 2551.0, 7019.0, 23580.0, 132927.0, 805627.0, 53278.0, 13157.0, 4313.0, 1769.0, 782.0, 387.0, 228.0, 143.0, 92.0, 54.0, 39.0, 18.0, 16.0, 15.0, 8.0, 10.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3671875, -10.03564453125, -9.7041015625, -9.37255859375, -9.041015625, -8.70947265625, -8.3779296875, -8.04638671875, -7.71484375, -7.38330078125, -7.0517578125, -6.72021484375, -6.388671875, -6.05712890625, -5.7255859375, -5.39404296875, -5.0625, -4.73095703125, -4.3994140625, -4.06787109375, -3.736328125, -3.40478515625, -3.0732421875, -2.74169921875, -2.41015625, -2.07861328125, -1.7470703125, -1.41552734375, -1.083984375, -0.75244140625, -0.4208984375, -0.08935546875, 0.2421875, 0.57373046875, 0.9052734375, 1.23681640625, 1.568359375, 1.89990234375, 2.2314453125, 2.56298828125, 2.89453125, 3.22607421875, 3.5576171875, 3.88916015625, 4.220703125, 4.55224609375, 4.8837890625, 5.21533203125, 5.546875, 5.87841796875, 6.2099609375, 6.54150390625, 6.873046875, 7.20458984375, 7.5361328125, 7.86767578125, 8.19921875, 8.53076171875, 8.8623046875, 9.19384765625, 9.525390625, 9.85693359375, 10.1884765625, 10.52001953125, 10.8515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 8.0, 9.0, 9.0, 12.0, 6.0, 14.0, 14.0, 29.0, 25.0, 34.0, 44.0, 64.0, 86.0, 87.0, 100.0, 86.0, 72.0, 65.0, 35.0, 32.0, 24.0, 16.0, 22.0, 11.0, 14.0, 9.0, 8.0, 2.0, 7.0, 3.0, 6.0, 5.0, 1.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00231170654296875, -0.0022357702255249023, -0.0021598339080810547, -0.002083897590637207, -0.0020079612731933594, -0.0019320249557495117, -0.001856088638305664, -0.0017801523208618164, -0.0017042160034179688, -0.001628279685974121, -0.0015523433685302734, -0.0014764070510864258, -0.0014004707336425781, -0.0013245344161987305, -0.0012485980987548828, -0.0011726617813110352, -0.0010967254638671875, -0.0010207891464233398, -0.0009448528289794922, -0.0008689165115356445, -0.0007929801940917969, -0.0007170438766479492, -0.0006411075592041016, -0.0005651712417602539, -0.0004892349243164062, -0.0004132986068725586, -0.00033736228942871094, -0.0002614259719848633, -0.00018548965454101562, -0.00010955333709716797, -3.361701965332031e-05, 4.2319297790527344e-05, 0.000118255615234375, 0.00019419193267822266, 0.0002701282501220703, 0.00034606456756591797, 0.0004220008850097656, 0.0004979372024536133, 0.0005738735198974609, 0.0006498098373413086, 0.0007257461547851562, 0.0008016824722290039, 0.0008776187896728516, 0.0009535551071166992, 0.0010294914245605469, 0.0011054277420043945, 0.0011813640594482422, 0.0012573003768920898, 0.0013332366943359375, 0.0014091730117797852, 0.0014851093292236328, 0.0015610456466674805, 0.0016369819641113281, 0.0017129182815551758, 0.0017888545989990234, 0.001864790916442871, 0.0019407272338867188, 0.0020166635513305664, 0.002092599868774414, 0.0021685361862182617, 0.0022444725036621094, 0.002320408821105957, 0.0023963451385498047, 0.0024722814559936523, 0.0025482177734375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 14.0, 25.0, 39.0, 83.0, 168.0, 396.0, 1049.0, 3295.0, 13561.0, 94612.0, 873580.0, 49261.0, 8744.0, 2315.0, 758.0, 289.0, 152.0, 85.0, 33.0, 19.0, 19.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.7919921875, -17.224609375, -16.6572265625, -16.08984375, -15.5224609375, -14.955078125, -14.3876953125, -13.8203125, -13.2529296875, -12.685546875, -12.1181640625, -11.55078125, -10.9833984375, -10.416015625, -9.8486328125, -9.28125, -8.7138671875, -8.146484375, -7.5791015625, -7.01171875, -6.4443359375, -5.876953125, -5.3095703125, -4.7421875, -4.1748046875, -3.607421875, -3.0400390625, -2.47265625, -1.9052734375, -1.337890625, -0.7705078125, -0.203125, 0.3642578125, 0.931640625, 1.4990234375, 2.06640625, 2.6337890625, 3.201171875, 3.7685546875, 4.3359375, 4.9033203125, 5.470703125, 6.0380859375, 6.60546875, 7.1728515625, 7.740234375, 8.3076171875, 8.875, 9.4423828125, 10.009765625, 10.5771484375, 11.14453125, 11.7119140625, 12.279296875, 12.8466796875, 13.4140625, 13.9814453125, 14.548828125, 15.1162109375, 15.68359375, 16.2509765625, 16.818359375, 17.3857421875, 17.953125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 7.0, 4.0, 2.0, 8.0, 7.0, 7.0, 11.0, 14.0, 11.0, 14.0, 18.0, 41.0, 39.0, 80.0, 72.0, 106.0, 108.0, 96.0, 88.0, 64.0, 38.0, 38.0, 30.0, 22.0, 17.0, 8.0, 6.0, 12.0, 7.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.324951171875, -11.87646484375, -11.427978515625, -10.9794921875, -10.531005859375, -10.08251953125, -9.634033203125, -9.185546875, -8.737060546875, -8.28857421875, -7.840087890625, -7.3916015625, -6.943115234375, -6.49462890625, -6.046142578125, -5.59765625, -5.149169921875, -4.70068359375, -4.252197265625, -3.8037109375, -3.355224609375, -2.90673828125, -2.458251953125, -2.009765625, -1.561279296875, -1.11279296875, -0.664306640625, -0.2158203125, 0.232666015625, 0.68115234375, 1.129638671875, 1.578125, 2.026611328125, 2.47509765625, 2.923583984375, 3.3720703125, 3.820556640625, 4.26904296875, 4.717529296875, 5.166015625, 5.614501953125, 6.06298828125, 6.511474609375, 6.9599609375, 7.408447265625, 7.85693359375, 8.305419921875, 8.75390625, 9.202392578125, 9.65087890625, 10.099365234375, 10.5478515625, 10.996337890625, 11.44482421875, 11.893310546875, 12.341796875, 12.790283203125, 13.23876953125, 13.687255859375, 14.1357421875, 14.584228515625, 15.03271484375, 15.481201171875, 15.9296875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 7.0, 13.0, 25.0, 47.0, 91.0, 353.0, 227.0, 68.0, 50.0, 40.0, 21.0, 23.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.28170776367188, -190.4730682373047, -176.66441345214844, -162.85577392578125, -149.047119140625, -135.2384796142578, -121.42984008789062, -107.6211929321289, -93.81254577636719, -80.00389862060547, -66.19525146484375, -52.38661193847656, -38.577964782714844, -24.769317626953125, -10.960678100585938, 2.8479690551757812, 16.6566162109375, 30.465261459350586, 44.27390670776367, 58.082550048828125, 71.89119720458984, 85.69984436035156, 99.50848388671875, 113.31713104248047, 127.12577819824219, 140.93441772460938, 154.74307250976562, 168.5517120361328, 182.3603515625, 196.16900634765625, 209.97764587402344, 223.78628540039062, 237.59490966796875, 251.40354919433594, 265.2121887207031, 279.0208435058594, 292.8294982910156, 306.63812255859375, 320.44677734375, 334.25543212890625, 348.0640869140625, 361.87274169921875, 375.6813659667969, 389.4900207519531, 403.2986755371094, 417.1072998046875, 430.91595458984375, 444.724609375, 458.5332336425781, 472.3418884277344, 486.1505126953125, 499.95916748046875, 513.767822265625, 527.5764770507812, 541.3851318359375, 555.1937255859375, 569.0023803710938, 582.81103515625, 596.6196899414062, 610.4283447265625, 624.2369384765625, 638.0455932617188, 651.854248046875, 665.6629028320312, 679.4715576171875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 6.0, 7.0, 12.0, 7.0, 20.0, 18.0, 24.0, 19.0, 21.0, 20.0, 37.0, 57.0, 154.0, 142.0, 136.0, 79.0, 33.0, 25.0, 25.0, 16.0, 21.0, 14.0, 16.0, 12.0, 17.0, 9.0, 3.0, 7.0, 9.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-413.6853942871094, -400.5760498046875, -387.4667053222656, -374.35736083984375, -361.24798583984375, -348.1386413574219, -335.029296875, -321.9199523925781, -308.81060791015625, -295.7012634277344, -282.5919189453125, -269.4825439453125, -256.3731994628906, -243.26385498046875, -230.15451049804688, -217.045166015625, -203.935791015625, -190.82644653320312, -177.7170867919922, -164.6077423095703, -151.49838256835938, -138.3890380859375, -125.27969360351562, -112.17034149169922, -99.06098937988281, -85.9516372680664, -72.84228515625, -59.732940673828125, -46.62358856201172, -33.51423645019531, -20.404891967773438, -7.295539855957031, 5.81378173828125, 18.923131942749023, 32.0324821472168, 45.14183044433594, 58.251182556152344, 71.36053466796875, 84.46987915039062, 97.57923126220703, 110.68858337402344, 123.79793548583984, 136.90728759765625, 150.01663208007812, 163.1259765625, 176.23533630371094, 189.3446807861328, 202.45404052734375, 215.56338500976562, 228.6727294921875, 241.78208923339844, 254.8914337158203, 268.00079345703125, 281.1101379394531, 294.219482421875, 307.3288269042969, 320.43817138671875, 333.5475158691406, 346.6568603515625, 359.7662353515625, 372.8755798339844, 385.98492431640625, 399.0942687988281, 412.20361328125, 425.31298828125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 13.0, 13.0, 25.0, 21.0, 30.0, 47.0, 47.0, 50.0, 89.0, 257.0, 113.0, 57.0, 44.0, 41.0, 28.0, 21.0, 16.0, 24.0, 15.0, 8.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.03125, -40.25732421875, -38.4833984375, -36.70947265625, -34.935546875, -33.16162109375, -31.3876953125, -29.61376953125, -27.83984375, -26.06591796875, -24.2919921875, -22.51806640625, -20.744140625, -18.97021484375, -17.1962890625, -15.42236328125, -13.6484375, -11.87451171875, -10.1005859375, -8.32666015625, -6.552734375, -4.77880859375, -3.0048828125, -1.23095703125, 0.54296875, 2.31689453125, 4.0908203125, 5.86474609375, 7.638671875, 9.41259765625, 11.1865234375, 12.96044921875, 14.734375, 16.50830078125, 18.2822265625, 20.05615234375, 21.830078125, 23.60400390625, 25.3779296875, 27.15185546875, 28.92578125, 30.69970703125, 32.4736328125, 34.24755859375, 36.021484375, 37.79541015625, 39.5693359375, 41.34326171875, 43.1171875, 44.89111328125, 46.6650390625, 48.43896484375, 50.212890625, 51.98681640625, 53.7607421875, 55.53466796875, 57.30859375, 59.08251953125, 60.8564453125, 62.63037109375, 64.404296875, 66.17822265625, 67.9521484375, 69.72607421875, 71.5]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 13.0, 13.0, 21.0, 41.0, 68.0, 77.0, 143.0, 295.0, 552.0, 1470.0, 3972.0, 14510.0, 8246618.0, 107654.0, 8369.0, 2630.0, 1018.0, 444.0, 214.0, 135.0, 72.0, 47.0, 35.0, 18.0, 22.0, 9.0, 10.0, 14.0, 16.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-173.3074951171875, -167.49594116210938, -161.6844024658203, -155.8728485107422, -150.06130981445312, -144.249755859375, -138.43820190429688, -132.62664794921875, -126.81510925292969, -121.0035629272461, -115.1920166015625, -109.38046264648438, -103.56891632080078, -97.75736999511719, -91.94581604003906, -86.13426971435547, -80.32272338867188, -74.51117706298828, -68.69963073730469, -62.88807678222656, -57.07653045654297, -51.264984130859375, -45.453433990478516, -39.641883850097656, -33.83033752441406, -28.018789291381836, -22.20724105834961, -16.395692825317383, -10.584144592285156, -4.77259635925293, 1.0389518737792969, 6.850502014160156, 12.662063598632812, 18.47361183166504, 24.285160064697266, 30.096708297729492, 35.90825653076172, 41.71980285644531, 47.53135299682617, 53.34290313720703, 59.154449462890625, 64.96599578857422, 70.77754211425781, 76.58909606933594, 82.40064239501953, 88.21218872070312, 94.02374267578125, 99.83528900146484, 105.64683532714844, 111.45838165283203, 117.26992797851562, 123.08148193359375, 128.89303588867188, 134.70457458496094, 140.51612854003906, 146.32766723632812, 152.13922119140625, 157.95077514648438, 163.76231384277344, 169.57386779785156, 175.38540649414062, 181.19696044921875, 187.00851440429688, 192.820068359375, 198.63160705566406]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 1.0, 1.0, 3.0, 6.0, 7.0, 0.0, 5.0, 4.0, 6.0, 7.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-320.3318786621094, -310.34954833984375, -300.3671875, -290.3848571777344, -280.40252685546875, -270.4201965332031, -260.4378662109375, -250.45550537109375, -240.47317504882812, -230.4908447265625, -220.5084991455078, -210.52615356445312, -200.5438232421875, -190.56149291992188, -180.5791473388672, -170.5968017578125, -160.61447143554688, -150.63214111328125, -140.64979553222656, -130.66744995117188, -120.68511962890625, -110.7027816772461, -100.72044372558594, -90.73810577392578, -80.75576782226562, -70.77342987060547, -60.79109191894531, -50.808753967285156, -40.826416015625, -30.844078063964844, -20.861740112304688, -10.879402160644531, -0.8970947265625, 9.085243225097656, 19.067581176757812, 29.04991912841797, 39.032257080078125, 49.01459503173828, 58.99693298339844, 68.9792709350586, 78.96160888671875, 88.9439468383789, 98.92628479003906, 108.90862274169922, 118.89096069335938, 128.873291015625, 138.8556365966797, 148.83798217773438, 158.8203125, 168.80264282226562, 178.7849884033203, 188.767333984375, 198.74966430664062, 208.73199462890625, 218.71434020996094, 228.69668579101562, 238.67901611328125, 248.66134643554688, 258.6436767578125, 268.62603759765625, 278.6083679199219, 288.5906982421875, 298.57305908203125, 308.5553894042969, 318.5377197265625]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 7.0, 4.0, 18.0, 23.0, 30.0, 35.0, 43.0, 59.0, 66.0, 65.0, 59.0, 48.0, 89.0, 80.0, 72.0, 64.0, 52.0, 46.0, 32.0, 27.0, 18.0, 11.0, 12.0, 8.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.375, -46.8662109375, -45.357421875, -43.8486328125, -42.33984375, -40.8310546875, -39.322265625, -37.8134765625, -36.3046875, -34.7958984375, -33.287109375, -31.7783203125, -30.26953125, -28.7607421875, -27.251953125, -25.7431640625, -24.234375, -22.7255859375, -21.216796875, -19.7080078125, -18.19921875, -16.6904296875, -15.181640625, -13.6728515625, -12.1640625, -10.6552734375, -9.146484375, -7.6376953125, -6.12890625, -4.6201171875, -3.111328125, -1.6025390625, -0.09375, 1.4150390625, 2.923828125, 4.4326171875, 5.94140625, 7.4501953125, 8.958984375, 10.4677734375, 11.9765625, 13.4853515625, 14.994140625, 16.5029296875, 18.01171875, 19.5205078125, 21.029296875, 22.5380859375, 24.046875, 25.5556640625, 27.064453125, 28.5732421875, 30.08203125, 31.5908203125, 33.099609375, 34.6083984375, 36.1171875, 37.6259765625, 39.134765625, 40.6435546875, 42.15234375, 43.6611328125, 45.169921875, 46.6787109375, 48.1875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 10.0, 15.0, 17.0, 44.0, 54.0, 66.0, 173.0, 342.0, 964.0, 2944.0, 11643.0, 54689.0, 244808.0, 165094.0, 32766.0, 7368.0, 1992.0, 710.0, 275.0, 122.0, 66.0, 33.0, 26.0, 28.0, 4.0, 4.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-351.25, -341.16796875, -331.0859375, -321.00390625, -310.921875, -300.83984375, -290.7578125, -280.67578125, -270.59375, -260.51171875, -250.4296875, -240.34765625, -230.265625, -220.18359375, -210.1015625, -200.01953125, -189.9375, -179.85546875, -169.7734375, -159.69140625, -149.609375, -139.52734375, -129.4453125, -119.36328125, -109.28125, -99.19921875, -89.1171875, -79.03515625, -68.953125, -58.87109375, -48.7890625, -38.70703125, -28.625, -18.54296875, -8.4609375, 1.62109375, 11.703125, 21.78515625, 31.8671875, 41.94921875, 52.03125, 62.11328125, 72.1953125, 82.27734375, 92.359375, 102.44140625, 112.5234375, 122.60546875, 132.6875, 142.76953125, 152.8515625, 162.93359375, 173.015625, 183.09765625, 193.1796875, 203.26171875, 213.34375, 223.42578125, 233.5078125, 243.58984375, 253.671875, 263.75390625, 273.8359375, 283.91796875, 294.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 9.0, 16.0, 8.0, 18.0, 14.0, 16.0, 37.0, 25.0, 36.0, 34.0, 48.0, 50.0, 39.0, 53.0, 68.0, 49.0, 54.0, 60.0, 40.0, 44.0, 44.0, 39.0, 36.0, 28.0, 18.0, 21.0, 16.0, 13.0, 9.0, 7.0, 5.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.59375, -27.64453125, -26.6953125, -25.74609375, -24.796875, -23.84765625, -22.8984375, -21.94921875, -21.0, -20.05078125, -19.1015625, -18.15234375, -17.203125, -16.25390625, -15.3046875, -14.35546875, -13.40625, -12.45703125, -11.5078125, -10.55859375, -9.609375, -8.66015625, -7.7109375, -6.76171875, -5.8125, -4.86328125, -3.9140625, -2.96484375, -2.015625, -1.06640625, -0.1171875, 0.83203125, 1.78125, 2.73046875, 3.6796875, 4.62890625, 5.578125, 6.52734375, 7.4765625, 8.42578125, 9.375, 10.32421875, 11.2734375, 12.22265625, 13.171875, 14.12109375, 15.0703125, 16.01953125, 16.96875, 17.91796875, 18.8671875, 19.81640625, 20.765625, 21.71484375, 22.6640625, 23.61328125, 24.5625, 25.51171875, 26.4609375, 27.41015625, 28.359375, 29.30859375, 30.2578125, 31.20703125, 32.15625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 12.0, 15.0, 27.0, 69.0, 92.0, 117.0, 63.0, 18.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-358.60430908203125, -348.249267578125, -337.89422607421875, -327.5391845703125, -317.18414306640625, -306.8290710449219, -296.4740295410156, -286.1189880371094, -275.7639465332031, -265.4089050292969, -255.05386352539062, -244.6988067626953, -234.34376525878906, -223.9887237548828, -213.6336669921875, -203.27862548828125, -192.923583984375, -182.56854248046875, -172.2135009765625, -161.8584442138672, -151.50340270996094, -141.1483612060547, -130.79330444335938, -120.43826293945312, -110.08322143554688, -99.72817993164062, -89.37313079833984, -79.01808166503906, -68.66304016113281, -58.3079948425293, -47.95294952392578, -37.597900390625, -27.24285888671875, -16.887813568115234, -6.532768249511719, 3.822277069091797, 14.177322387695312, 24.532367706298828, 34.887413024902344, 45.242462158203125, 55.597503662109375, 65.95254516601562, 76.3075942993164, 86.66264343261719, 97.01768493652344, 107.37272644042969, 117.72777557373047, 128.08282470703125, 138.4378662109375, 148.79290771484375, 159.14794921875, 169.5030059814453, 179.85804748535156, 190.2130889892578, 200.56814575195312, 210.92318725585938, 221.27822875976562, 231.63327026367188, 241.98831176757812, 252.34336853027344, 262.69842529296875, 273.053466796875, 283.40850830078125, 293.7635498046875, 304.11859130859375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 9.0, 5.0, 6.0, 11.0, 17.0, 30.0, 45.0, 81.0, 87.0, 69.0, 40.0, 23.0, 7.0, 5.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-271.1093444824219, -264.0339660644531, -256.9585876464844, -249.8832244873047, -242.80784606933594, -235.7324676513672, -228.6571044921875, -221.58172607421875, -214.50634765625, -207.43096923828125, -200.3555908203125, -193.2802276611328, -186.20484924316406, -179.1294708251953, -172.05410766601562, -164.97872924804688, -157.90335083007812, -150.82797241210938, -143.75259399414062, -136.67723083496094, -129.6018524169922, -122.52647399902344, -115.45110321044922, -108.375732421875, -101.30035400390625, -94.2249755859375, -87.14960479736328, -80.07423400878906, -72.99885559082031, -65.92347717285156, -58.848106384277344, -51.77273178100586, -44.69734191894531, -37.62196731567383, -30.546592712402344, -23.47121810913086, -16.395843505859375, -9.32046890258789, -2.2450942993164062, 4.830280303955078, 11.905654907226562, 18.981029510498047, 26.05640411376953, 33.131778717041016, 40.2071533203125, 47.282527923583984, 54.35790252685547, 61.43327713012695, 68.50865173339844, 75.58403015136719, 82.6594009399414, 89.73477172851562, 96.81015014648438, 103.88552856445312, 110.96089935302734, 118.03627014160156, 125.11164855957031, 132.18702697753906, 139.26239013671875, 146.3377685546875, 153.41314697265625, 160.488525390625, 167.56390380859375, 174.63926696777344, 181.7146453857422]}, "eval/loss": 0.6976933479309082, "eval/wer": 0.12308607695358985, "eval/runtime": 636.3851, "eval/samples_per_second": 4.152, "eval/steps_per_second": 0.52} \ No newline at end of file +{"train/loss": 0.2868, "train/learning_rate": 1.1267605633802817e-08, "train/epoch": 25.0, "train/global_step": 22300, "_runtime": 134750, "_timestamp": 1648276094, "_step": 22314, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 5.0, 7.0, 6.0, 24.0, 16.0, 17.0, 28.0, 27.0, 41.0, 41.0, 57.0, 59.0, 69.0, 82.0, 96.0, 86.0, 78.0, 58.0, 45.0, 38.0, 26.0, 29.0, 15.0, 12.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-151.30198669433594, -147.59866333007812, -143.8953399658203, -140.1920166015625, -136.4886932373047, -132.78536987304688, -129.08204650878906, -125.37871551513672, -121.6753921508789, -117.9720687866211, -114.26874542236328, -110.56542205810547, -106.86209106445312, -103.15876770019531, -99.4554443359375, -95.75212097167969, -92.04879760742188, -88.34547424316406, -84.64215087890625, -80.93882751464844, -77.23550415039062, -73.53218078613281, -69.82884979248047, -66.12552642822266, -62.422203063964844, -58.71887969970703, -55.01555633544922, -51.31222915649414, -47.60890579223633, -43.905582427978516, -40.20225524902344, -36.498931884765625, -32.795616149902344, -29.09229278564453, -25.388967514038086, -21.68564224243164, -17.982318878173828, -14.278995513916016, -10.57567024230957, -6.872344970703125, -3.1690216064453125, 0.5343027114868164, 4.237627029418945, 7.940951347351074, 11.644275665283203, 15.347599029541016, 19.05092430114746, 22.754249572753906, 26.45757293701172, 30.16089630126953, 33.864219665527344, 37.56754684448242, 41.270870208740234, 44.97419357299805, 48.677520751953125, 52.38084411621094, 56.08416748046875, 59.78749084472656, 63.490814208984375, 67.19413757324219, 70.8974609375, 74.60078430175781, 78.30411529541016, 82.00743865966797, 85.71076202392578]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 5.0, 5.0, 9.0, 6.0, 9.0, 9.0, 17.0, 11.0, 20.0, 22.0, 17.0, 22.0, 27.0, 28.0, 41.0, 43.0, 41.0, 38.0, 29.0, 37.0, 41.0, 42.0, 39.0, 49.0, 32.0, 36.0, 39.0, 43.0, 36.0, 28.0, 21.0, 19.0, 23.0, 23.0, 17.0, 19.0, 14.0, 11.0, 9.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-68.2059097290039, -65.8742904663086, -63.54267501831055, -61.2110595703125, -58.87944030761719, -56.54782485961914, -54.216209411621094, -51.88459014892578, -49.552974700927734, -47.22135925292969, -44.889739990234375, -42.55812454223633, -40.22650909423828, -37.89488983154297, -35.56327438354492, -33.231658935546875, -30.900039672851562, -28.568422317504883, -26.236804962158203, -23.905189514160156, -21.573572158813477, -19.241954803466797, -16.91033935546875, -14.57872200012207, -12.24710464477539, -9.915487289428711, -7.583870887756348, -5.252254009246826, -2.9206371307373047, -0.589019775390625, 1.7425966262817383, 4.074213027954102, 6.4058380126953125, 8.737455368041992, 11.069071769714355, 13.400688171386719, 15.732305526733398, 18.063922882080078, 20.395538330078125, 22.727155685424805, 25.058773040771484, 27.390390396118164, 29.722007751464844, 32.05362319946289, 34.38523864746094, 36.71685791015625, 39.0484733581543, 41.380088806152344, 43.711708068847656, 46.0433235168457, 48.374942779541016, 50.70655822753906, 53.038177490234375, 55.36979293823242, 57.70140838623047, 60.03302764892578, 62.36464309692383, 64.69625854492188, 67.02787780761719, 69.3594970703125, 71.69110870361328, 74.0227279663086, 76.3543472290039, 78.68595886230469, 81.017578125]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 11.0, 12.0, 18.0, 28.0, 29.0, 53.0, 108.0, 107.0, 163.0, 256.0, 330.0, 564.0, 776.0, 1236.0, 1872.0, 3065.0, 4669.0, 7626.0, 12886.0, 22633.0, 41141.0, 80592.0, 188661.0, 947081.0, 2287244.0, 348355.0, 115935.0, 55682.0, 29584.0, 16883.0, 9812.0, 5959.0, 3823.0, 2390.0, 1520.0, 1027.0, 673.0, 441.0, 317.0, 229.0, 154.0, 100.0, 75.0, 41.0, 39.0, 20.0, 21.0, 11.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-244.5, -236.67578125, -228.8515625, -221.02734375, -213.203125, -205.37890625, -197.5546875, -189.73046875, -181.90625, -174.08203125, -166.2578125, -158.43359375, -150.609375, -142.78515625, -134.9609375, -127.13671875, -119.3125, -111.48828125, -103.6640625, -95.83984375, -88.015625, -80.19140625, -72.3671875, -64.54296875, -56.71875, -48.89453125, -41.0703125, -33.24609375, -25.421875, -17.59765625, -9.7734375, -1.94921875, 5.875, 13.69921875, 21.5234375, 29.34765625, 37.171875, 44.99609375, 52.8203125, 60.64453125, 68.46875, 76.29296875, 84.1171875, 91.94140625, 99.765625, 107.58984375, 115.4140625, 123.23828125, 131.0625, 138.88671875, 146.7109375, 154.53515625, 162.359375, 170.18359375, 178.0078125, 185.83203125, 193.65625, 201.48046875, 209.3046875, 217.12890625, 224.953125, 232.77734375, 240.6015625, 248.42578125, 256.25]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 6.0, 5.0, 15.0, 13.0, 16.0, 16.0, 22.0, 22.0, 35.0, 32.0, 24.0, 40.0, 39.0, 38.0, 48.0, 53.0, 53.0, 38.0, 57.0, 37.0, 41.0, 35.0, 37.0, 40.0, 33.0, 40.0, 27.0, 18.0, 25.0, 19.0, 18.0, 10.0, 14.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.5, -73.923828125, -71.34765625, -68.771484375, -66.1953125, -63.619140625, -61.04296875, -58.466796875, -55.890625, -53.314453125, -50.73828125, -48.162109375, -45.5859375, -43.009765625, -40.43359375, -37.857421875, -35.28125, -32.705078125, -30.12890625, -27.552734375, -24.9765625, -22.400390625, -19.82421875, -17.248046875, -14.671875, -12.095703125, -9.51953125, -6.943359375, -4.3671875, -1.791015625, 0.78515625, 3.361328125, 5.9375, 8.513671875, 11.08984375, 13.666015625, 16.2421875, 18.818359375, 21.39453125, 23.970703125, 26.546875, 29.123046875, 31.69921875, 34.275390625, 36.8515625, 39.427734375, 42.00390625, 44.580078125, 47.15625, 49.732421875, 52.30859375, 54.884765625, 57.4609375, 60.037109375, 62.61328125, 65.189453125, 67.765625, 70.341796875, 72.91796875, 75.494140625, 78.0703125, 80.646484375, 83.22265625, 85.798828125, 88.375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 4.0, 7.0, 20.0, 13.0, 26.0, 36.0, 60.0, 61.0, 107.0, 158.0, 234.0, 376.0, 559.0, 822.0, 1219.0, 1891.0, 2835.0, 4483.0, 6999.0, 11484.0, 18649.0, 30897.0, 51990.0, 92909.0, 172017.0, 372599.0, 1327744.0, 1326657.0, 371097.0, 172183.0, 92267.0, 52629.0, 30890.0, 18748.0, 11327.0, 7083.0, 4602.0, 2971.0, 1872.0, 1273.0, 849.0, 554.0, 355.0, 248.0, 153.0, 111.0, 74.0, 40.0, 28.0, 33.0, 17.0, 10.0, 14.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-139.5, -135.0, -130.5, -126.0, -121.5, -117.0, -112.5, -108.0, -103.5, -99.0, -94.5, -90.0, -85.5, -81.0, -76.5, -72.0, -67.5, -63.0, -58.5, -54.0, -49.5, -45.0, -40.5, -36.0, -31.5, -27.0, -22.5, -18.0, -13.5, -9.0, -4.5, 0.0, 4.5, 9.0, 13.5, 18.0, 22.5, 27.0, 31.5, 36.0, 40.5, 45.0, 49.5, 54.0, 58.5, 63.0, 67.5, 72.0, 76.5, 81.0, 85.5, 90.0, 94.5, 99.0, 103.5, 108.0, 112.5, 117.0, 121.5, 126.0, 130.5, 135.0, 139.5, 144.0, 148.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 8.0, 9.0, 10.0, 14.0, 13.0, 21.0, 25.0, 29.0, 37.0, 45.0, 39.0, 60.0, 77.0, 63.0, 91.0, 122.0, 121.0, 154.0, 196.0, 273.0, 395.0, 473.0, 384.0, 271.0, 196.0, 160.0, 122.0, 113.0, 95.0, 72.0, 69.0, 50.0, 55.0, 37.0, 27.0, 33.0, 22.0, 22.0, 19.0, 15.0, 6.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.5, -37.1904296875, -35.880859375, -34.5712890625, -33.26171875, -31.9521484375, -30.642578125, -29.3330078125, -28.0234375, -26.7138671875, -25.404296875, -24.0947265625, -22.78515625, -21.4755859375, -20.166015625, -18.8564453125, -17.546875, -16.2373046875, -14.927734375, -13.6181640625, -12.30859375, -10.9990234375, -9.689453125, -8.3798828125, -7.0703125, -5.7607421875, -4.451171875, -3.1416015625, -1.83203125, -0.5224609375, 0.787109375, 2.0966796875, 3.40625, 4.7158203125, 6.025390625, 7.3349609375, 8.64453125, 9.9541015625, 11.263671875, 12.5732421875, 13.8828125, 15.1923828125, 16.501953125, 17.8115234375, 19.12109375, 20.4306640625, 21.740234375, 23.0498046875, 24.359375, 25.6689453125, 26.978515625, 28.2880859375, 29.59765625, 30.9072265625, 32.216796875, 33.5263671875, 34.8359375, 36.1455078125, 37.455078125, 38.7646484375, 40.07421875, 41.3837890625, 42.693359375, 44.0029296875, 45.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 8.0, 9.0, 10.0, 12.0, 17.0, 13.0, 20.0, 25.0, 30.0, 36.0, 38.0, 49.0, 56.0, 69.0, 71.0, 65.0, 79.0, 60.0, 48.0, 52.0, 39.0, 31.0, 24.0, 20.0, 18.0, 16.0, 11.0, 11.0, 12.0, 9.0, 7.0, 6.0, 4.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.65741729736328, -107.41815948486328, -104.17890930175781, -100.93965148925781, -97.70040130615234, -94.46114349365234, -91.22189331054688, -87.98263549804688, -84.7433853149414, -81.5041275024414, -78.26487731933594, -75.02561950683594, -71.78636932373047, -68.54711151123047, -65.307861328125, -62.068603515625, -58.829349517822266, -55.59009552001953, -52.3508415222168, -49.11158752441406, -45.87233352661133, -42.633079528808594, -39.393821716308594, -36.154571533203125, -32.915313720703125, -29.67605972290039, -26.436805725097656, -23.197551727294922, -19.958297729492188, -16.71904182434082, -13.479787826538086, -10.240533828735352, -7.00128173828125, -3.7620275020599365, -0.522773265838623, 2.7164812088012695, 5.955735206604004, 9.194990158081055, 12.434244155883789, 15.673498153686523, 18.912752151489258, 22.152006149291992, 25.391260147094727, 28.630516052246094, 31.869770050048828, 35.10902404785156, 38.3482780456543, 41.58753204345703, 44.826786041259766, 48.0660400390625, 51.305294036865234, 54.54454803466797, 57.7838020324707, 61.02305603027344, 64.26231384277344, 67.5015640258789, 70.7408218383789, 73.9800796508789, 77.21932983398438, 80.45858764648438, 83.69783782958984, 86.93709564208984, 90.17634582519531, 93.41560363769531, 96.65485382080078]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 8.0, 6.0, 13.0, 15.0, 16.0, 26.0, 25.0, 34.0, 25.0, 30.0, 30.0, 37.0, 28.0, 49.0, 48.0, 43.0, 34.0, 41.0, 42.0, 50.0, 34.0, 32.0, 41.0, 42.0, 37.0, 29.0, 22.0, 22.0, 21.0, 22.0, 16.0, 17.0, 9.0, 16.0, 8.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-101.45652770996094, -98.67851257324219, -95.9004898071289, -93.12247467041016, -90.34445190429688, -87.56643676757812, -84.78842163085938, -82.0103988647461, -79.23237609863281, -76.45436096191406, -73.67633819580078, -70.89832305908203, -68.12030029296875, -65.34228515625, -62.564266204833984, -59.78624725341797, -57.00823211669922, -54.2302131652832, -51.45219421386719, -48.67417907714844, -45.896156311035156, -43.118141174316406, -40.34012222290039, -37.562103271484375, -34.78408432006836, -32.006065368652344, -29.228046417236328, -26.450029373168945, -23.67201042175293, -20.893991470336914, -18.11597442626953, -15.337955474853516, -12.559944152832031, -9.781925201416016, -7.003907203674316, -4.225889205932617, -1.4478702545166016, 1.330148696899414, 4.108165740966797, 6.8861846923828125, 9.664203643798828, 12.442222595214844, 15.220240592956543, 17.998258590698242, 20.776277542114258, 23.554296493530273, 26.332313537597656, 29.110332489013672, 31.888351440429688, 34.6663703918457, 37.44438934326172, 40.22240447998047, 43.00042724609375, 45.7784423828125, 48.556461334228516, 51.33448028564453, 54.11249923706055, 56.89051818847656, 59.66853713989258, 62.446556091308594, 65.22457122802734, 68.00259399414062, 70.78060913085938, 73.55862426757812, 76.3366470336914]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 26.0, 24.0, 39.0, 48.0, 84.0, 112.0, 173.0, 247.0, 394.0, 600.0, 972.0, 1362.0, 2078.0, 3369.0, 5550.0, 9380.0, 15744.0, 27919.0, 51158.0, 97672.0, 192739.0, 285786.0, 164591.0, 83739.0, 44649.0, 24379.0, 13724.0, 8155.0, 5048.0, 3137.0, 2009.0, 1239.0, 806.0, 506.0, 340.0, 213.0, 175.0, 123.0, 72.0, 50.0, 37.0, 24.0, 14.0, 15.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-136.375, -132.1640625, -127.953125, -123.7421875, -119.53125, -115.3203125, -111.109375, -106.8984375, -102.6875, -98.4765625, -94.265625, -90.0546875, -85.84375, -81.6328125, -77.421875, -73.2109375, -69.0, -64.7890625, -60.578125, -56.3671875, -52.15625, -47.9453125, -43.734375, -39.5234375, -35.3125, -31.1015625, -26.890625, -22.6796875, -18.46875, -14.2578125, -10.046875, -5.8359375, -1.625, 2.5859375, 6.796875, 11.0078125, 15.21875, 19.4296875, 23.640625, 27.8515625, 32.0625, 36.2734375, 40.484375, 44.6953125, 48.90625, 53.1171875, 57.328125, 61.5390625, 65.75, 69.9609375, 74.171875, 78.3828125, 82.59375, 86.8046875, 91.015625, 95.2265625, 99.4375, 103.6484375, 107.859375, 112.0703125, 116.28125, 120.4921875, 124.703125, 128.9140625, 133.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 9.0, 4.0, 8.0, 8.0, 18.0, 17.0, 18.0, 25.0, 28.0, 28.0, 36.0, 27.0, 40.0, 37.0, 43.0, 51.0, 56.0, 49.0, 43.0, 38.0, 38.0, 37.0, 35.0, 36.0, 46.0, 27.0, 27.0, 29.0, 15.0, 22.0, 27.0, 11.0, 17.0, 9.0, 14.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-101.3125, -98.515625, -95.71875, -92.921875, -90.125, -87.328125, -84.53125, -81.734375, -78.9375, -76.140625, -73.34375, -70.546875, -67.75, -64.953125, -62.15625, -59.359375, -56.5625, -53.765625, -50.96875, -48.171875, -45.375, -42.578125, -39.78125, -36.984375, -34.1875, -31.390625, -28.59375, -25.796875, -23.0, -20.203125, -17.40625, -14.609375, -11.8125, -9.015625, -6.21875, -3.421875, -0.625, 2.171875, 4.96875, 7.765625, 10.5625, 13.359375, 16.15625, 18.953125, 21.75, 24.546875, 27.34375, 30.140625, 32.9375, 35.734375, 38.53125, 41.328125, 44.125, 46.921875, 49.71875, 52.515625, 55.3125, 58.109375, 60.90625, 63.703125, 66.5, 69.296875, 72.09375, 74.890625, 77.6875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 7.0, 13.0, 19.0, 24.0, 34.0, 45.0, 66.0, 85.0, 112.0, 158.0, 243.0, 334.0, 523.0, 690.0, 988.0, 1460.0, 2228.0, 3397.0, 5229.0, 8498.0, 14213.0, 24711.0, 45831.0, 94309.0, 216723.0, 322761.0, 151198.0, 68890.0, 35120.0, 19395.0, 11253.0, 6939.0, 4341.0, 2797.0, 1896.0, 1244.0, 798.0, 608.0, 414.0, 270.0, 184.0, 124.0, 102.0, 74.0, 62.0, 41.0, 31.0, 19.0, 10.0, 9.0, 9.0, 4.0, 3.0, 7.0, 3.0, 2.0, 4.0], "bins": [-166.0, -160.859375, -155.71875, -150.578125, -145.4375, -140.296875, -135.15625, -130.015625, -124.875, -119.734375, -114.59375, -109.453125, -104.3125, -99.171875, -94.03125, -88.890625, -83.75, -78.609375, -73.46875, -68.328125, -63.1875, -58.046875, -52.90625, -47.765625, -42.625, -37.484375, -32.34375, -27.203125, -22.0625, -16.921875, -11.78125, -6.640625, -1.5, 3.640625, 8.78125, 13.921875, 19.0625, 24.203125, 29.34375, 34.484375, 39.625, 44.765625, 49.90625, 55.046875, 60.1875, 65.328125, 70.46875, 75.609375, 80.75, 85.890625, 91.03125, 96.171875, 101.3125, 106.453125, 111.59375, 116.734375, 121.875, 127.015625, 132.15625, 137.296875, 142.4375, 147.578125, 152.71875, 157.859375, 163.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 10.0, 19.0, 18.0, 21.0, 16.0, 20.0, 21.0, 24.0, 28.0, 34.0, 32.0, 41.0, 50.0, 37.0, 50.0, 44.0, 42.0, 44.0, 38.0, 52.0, 42.0, 51.0, 31.0, 39.0, 32.0, 18.0, 23.0, 11.0, 24.0, 16.0, 6.0, 12.0, 12.0, 6.0, 5.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.21875, -57.23388671875, -55.2490234375, -53.26416015625, -51.279296875, -49.29443359375, -47.3095703125, -45.32470703125, -43.33984375, -41.35498046875, -39.3701171875, -37.38525390625, -35.400390625, -33.41552734375, -31.4306640625, -29.44580078125, -27.4609375, -25.47607421875, -23.4912109375, -21.50634765625, -19.521484375, -17.53662109375, -15.5517578125, -13.56689453125, -11.58203125, -9.59716796875, -7.6123046875, -5.62744140625, -3.642578125, -1.65771484375, 0.3271484375, 2.31201171875, 4.296875, 6.28173828125, 8.2666015625, 10.25146484375, 12.236328125, 14.22119140625, 16.2060546875, 18.19091796875, 20.17578125, 22.16064453125, 24.1455078125, 26.13037109375, 28.115234375, 30.10009765625, 32.0849609375, 34.06982421875, 36.0546875, 38.03955078125, 40.0244140625, 42.00927734375, 43.994140625, 45.97900390625, 47.9638671875, 49.94873046875, 51.93359375, 53.91845703125, 55.9033203125, 57.88818359375, 59.873046875, 61.85791015625, 63.8427734375, 65.82763671875, 67.8125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 6.0, 16.0, 10.0, 16.0, 17.0, 25.0, 34.0, 50.0, 68.0, 106.0, 120.0, 207.0, 333.0, 490.0, 827.0, 1416.0, 2519.0, 5305.0, 14173.0, 68530.0, 698566.0, 211555.0, 27635.0, 8116.0, 3588.0, 1828.0, 1113.0, 652.0, 415.0, 286.0, 164.0, 112.0, 81.0, 50.0, 35.0, 36.0, 16.0, 13.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-159.875, -155.13671875, -150.3984375, -145.66015625, -140.921875, -136.18359375, -131.4453125, -126.70703125, -121.96875, -117.23046875, -112.4921875, -107.75390625, -103.015625, -98.27734375, -93.5390625, -88.80078125, -84.0625, -79.32421875, -74.5859375, -69.84765625, -65.109375, -60.37109375, -55.6328125, -50.89453125, -46.15625, -41.41796875, -36.6796875, -31.94140625, -27.203125, -22.46484375, -17.7265625, -12.98828125, -8.25, -3.51171875, 1.2265625, 5.96484375, 10.703125, 15.44140625, 20.1796875, 24.91796875, 29.65625, 34.39453125, 39.1328125, 43.87109375, 48.609375, 53.34765625, 58.0859375, 62.82421875, 67.5625, 72.30078125, 77.0390625, 81.77734375, 86.515625, 91.25390625, 95.9921875, 100.73046875, 105.46875, 110.20703125, 114.9453125, 119.68359375, 124.421875, 129.16015625, 133.8984375, 138.63671875, 143.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 15.0, 17.0, 22.0, 48.0, 69.0, 143.0, 243.0, 187.0, 101.0, 54.0, 45.0, 15.0, 18.0, 6.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007694244384765625, -0.007286727428436279, -0.006879210472106934, -0.006471693515777588, -0.006064176559448242, -0.0056566596031188965, -0.005249142646789551, -0.004841625690460205, -0.004434108734130859, -0.004026591777801514, -0.003619074821472168, -0.0032115578651428223, -0.0028040409088134766, -0.002396523952484131, -0.001989006996154785, -0.0015814900398254395, -0.0011739730834960938, -0.000766456127166748, -0.00035893917083740234, 4.857778549194336e-05, 0.00045609474182128906, 0.0008636116981506348, 0.0012711286544799805, 0.0016786456108093262, 0.002086162567138672, 0.0024936795234680176, 0.0029011964797973633, 0.003308713436126709, 0.0037162303924560547, 0.0041237473487854, 0.004531264305114746, 0.004938781261444092, 0.0053462982177734375, 0.005753815174102783, 0.006161332130432129, 0.006568849086761475, 0.00697636604309082, 0.007383882999420166, 0.007791399955749512, 0.008198916912078857, 0.008606433868408203, 0.009013950824737549, 0.009421467781066895, 0.00982898473739624, 0.010236501693725586, 0.010644018650054932, 0.011051535606384277, 0.011459052562713623, 0.011866569519042969, 0.012274086475372314, 0.01268160343170166, 0.013089120388031006, 0.013496637344360352, 0.013904154300689697, 0.014311671257019043, 0.014719188213348389, 0.015126705169677734, 0.01553422212600708, 0.015941739082336426, 0.01634925603866577, 0.016756772994995117, 0.017164289951324463, 0.01757180690765381, 0.017979323863983154, 0.0183868408203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 9.0, 10.0, 16.0, 20.0, 31.0, 37.0, 58.0, 74.0, 94.0, 134.0, 155.0, 234.0, 334.0, 498.0, 635.0, 947.0, 1422.0, 2075.0, 3224.0, 5257.0, 9635.0, 17862.0, 37229.0, 86105.0, 228337.0, 372032.0, 157571.0, 61598.0, 27801.0, 14210.0, 7636.0, 4549.0, 2787.0, 1787.0, 1180.0, 863.0, 599.0, 406.0, 295.0, 219.0, 142.0, 127.0, 84.0, 67.0, 48.0, 41.0, 31.0, 10.0, 13.0, 5.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-60.75, -58.8701171875, -56.990234375, -55.1103515625, -53.23046875, -51.3505859375, -49.470703125, -47.5908203125, -45.7109375, -43.8310546875, -41.951171875, -40.0712890625, -38.19140625, -36.3115234375, -34.431640625, -32.5517578125, -30.671875, -28.7919921875, -26.912109375, -25.0322265625, -23.15234375, -21.2724609375, -19.392578125, -17.5126953125, -15.6328125, -13.7529296875, -11.873046875, -9.9931640625, -8.11328125, -6.2333984375, -4.353515625, -2.4736328125, -0.59375, 1.2861328125, 3.166015625, 5.0458984375, 6.92578125, 8.8056640625, 10.685546875, 12.5654296875, 14.4453125, 16.3251953125, 18.205078125, 20.0849609375, 21.96484375, 23.8447265625, 25.724609375, 27.6044921875, 29.484375, 31.3642578125, 33.244140625, 35.1240234375, 37.00390625, 38.8837890625, 40.763671875, 42.6435546875, 44.5234375, 46.4033203125, 48.283203125, 50.1630859375, 52.04296875, 53.9228515625, 55.802734375, 57.6826171875, 59.5625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 3.0, 13.0, 13.0, 15.0, 23.0, 27.0, 25.0, 44.0, 70.0, 45.0, 71.0, 79.0, 96.0, 93.0, 78.0, 59.0, 47.0, 30.0, 30.0, 28.0, 22.0, 17.0, 15.0, 9.0, 4.0, 12.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.265625, -19.658203125, -19.05078125, -18.443359375, -17.8359375, -17.228515625, -16.62109375, -16.013671875, -15.40625, -14.798828125, -14.19140625, -13.583984375, -12.9765625, -12.369140625, -11.76171875, -11.154296875, -10.546875, -9.939453125, -9.33203125, -8.724609375, -8.1171875, -7.509765625, -6.90234375, -6.294921875, -5.6875, -5.080078125, -4.47265625, -3.865234375, -3.2578125, -2.650390625, -2.04296875, -1.435546875, -0.828125, -0.220703125, 0.38671875, 0.994140625, 1.6015625, 2.208984375, 2.81640625, 3.423828125, 4.03125, 4.638671875, 5.24609375, 5.853515625, 6.4609375, 7.068359375, 7.67578125, 8.283203125, 8.890625, 9.498046875, 10.10546875, 10.712890625, 11.3203125, 11.927734375, 12.53515625, 13.142578125, 13.75, 14.357421875, 14.96484375, 15.572265625, 16.1796875, 16.787109375, 17.39453125, 18.001953125, 18.609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 4.0, 14.0, 8.0, 17.0, 24.0, 13.0, 27.0, 36.0, 35.0, 48.0, 62.0, 71.0, 63.0, 84.0, 88.0, 73.0, 60.0, 51.0, 34.0, 33.0, 36.0, 29.0, 16.0, 17.0, 13.0, 10.0, 8.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-125.12419128417969, -121.61530303955078, -118.10641479492188, -114.5975341796875, -111.0886459350586, -107.57975769042969, -104.07087707519531, -100.5619888305664, -97.0531005859375, -93.5442123413086, -90.03532409667969, -86.52644348144531, -83.0175552368164, -79.5086669921875, -75.99978637695312, -72.49089813232422, -68.98200988769531, -65.4731216430664, -61.964237213134766, -58.455352783203125, -54.94646453857422, -51.43757629394531, -47.92869186401367, -44.41980743408203, -40.910919189453125, -37.40203094482422, -33.89314651489258, -30.384260177612305, -26.87537384033203, -23.366487503051758, -19.857601165771484, -16.34871482849121, -12.839820861816406, -9.330934524536133, -5.822048187255859, -2.313161849975586, 1.1957244873046875, 4.704610824584961, 8.213497161865234, 11.722383499145508, 15.231269836425781, 18.740156173706055, 22.249042510986328, 25.7579288482666, 29.266815185546875, 32.77570343017578, 36.28458786010742, 39.79347229003906, 43.30236053466797, 46.811248779296875, 50.320133209228516, 53.829017639160156, 57.33790588378906, 60.84679412841797, 64.35568237304688, 67.86456298828125, 71.37345123291016, 74.88233947753906, 78.39122009277344, 81.90010833740234, 85.40899658203125, 88.91788482666016, 92.42677307128906, 95.93565368652344, 99.44454193115234]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 5.0, 11.0, 7.0, 8.0, 15.0, 12.0, 26.0, 22.0, 27.0, 34.0, 29.0, 34.0, 38.0, 34.0, 38.0, 43.0, 47.0, 46.0, 32.0, 33.0, 39.0, 44.0, 35.0, 42.0, 38.0, 38.0, 37.0, 26.0, 20.0, 15.0, 22.0, 19.0, 18.0, 9.0, 12.0, 18.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-89.54629516601562, -87.0429458618164, -84.53958892822266, -82.03623962402344, -79.53289031982422, -77.029541015625, -74.52618408203125, -72.02283477783203, -69.51948547363281, -67.0161361694336, -64.51277923583984, -62.009429931640625, -59.506080627441406, -57.00272750854492, -54.49937438964844, -51.99602508544922, -49.49266815185547, -46.989315032958984, -44.485965728759766, -41.98261260986328, -39.47926330566406, -36.97591018676758, -34.472557067871094, -31.969205856323242, -29.46585464477539, -26.96250343322754, -24.459152221679688, -21.955799102783203, -19.45244789123535, -16.9490966796875, -14.445744514465332, -11.942392349243164, -9.439041137695312, -6.935689449310303, -4.432337760925293, -1.9289860725402832, 0.5743656158447266, 3.077716827392578, 5.581068992614746, 8.084421157836914, 10.587772369384766, 13.091123580932617, 15.594475746154785, 18.097827911376953, 20.601179122924805, 23.104530334472656, 25.60788345336914, 28.111234664916992, 30.614585876464844, 33.11793899536133, 35.62128829956055, 38.12464141845703, 40.62799072265625, 43.131343841552734, 45.63469696044922, 48.13804626464844, 50.64139938354492, 53.144752502441406, 55.648101806640625, 58.15145492553711, 60.654808044433594, 63.15815734863281, 65.66150665283203, 68.16486358642578, 70.668212890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 12.0, 24.0, 32.0, 44.0, 69.0, 95.0, 152.0, 197.0, 315.0, 444.0, 679.0, 994.0, 1504.0, 2203.0, 3243.0, 5054.0, 7190.0, 10846.0, 16108.0, 24199.0, 36866.0, 57281.0, 89018.0, 142174.0, 203276.0, 159389.0, 100229.0, 64158.0, 41377.0, 27044.0, 17762.0, 11889.0, 8055.0, 5426.0, 3711.0, 2378.0, 1686.0, 1085.0, 757.0, 513.0, 335.0, 221.0, 146.0, 128.0, 64.0, 60.0, 34.0, 21.0, 26.0, 4.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0], "bins": [-95.1875, -92.177734375, -89.16796875, -86.158203125, -83.1484375, -80.138671875, -77.12890625, -74.119140625, -71.109375, -68.099609375, -65.08984375, -62.080078125, -59.0703125, -56.060546875, -53.05078125, -50.041015625, -47.03125, -44.021484375, -41.01171875, -38.001953125, -34.9921875, -31.982421875, -28.97265625, -25.962890625, -22.953125, -19.943359375, -16.93359375, -13.923828125, -10.9140625, -7.904296875, -4.89453125, -1.884765625, 1.125, 4.134765625, 7.14453125, 10.154296875, 13.1640625, 16.173828125, 19.18359375, 22.193359375, 25.203125, 28.212890625, 31.22265625, 34.232421875, 37.2421875, 40.251953125, 43.26171875, 46.271484375, 49.28125, 52.291015625, 55.30078125, 58.310546875, 61.3203125, 64.330078125, 67.33984375, 70.349609375, 73.359375, 76.369140625, 79.37890625, 82.388671875, 85.3984375, 88.408203125, 91.41796875, 94.427734375, 97.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 6.0, 8.0, 12.0, 16.0, 17.0, 24.0, 33.0, 33.0, 28.0, 34.0, 41.0, 28.0, 36.0, 43.0, 54.0, 49.0, 39.0, 39.0, 42.0, 43.0, 46.0, 37.0, 40.0, 35.0, 32.0, 34.0, 19.0, 18.0, 24.0, 15.0, 11.0, 11.0, 8.0, 9.0, 11.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-93.0, -90.3916015625, -87.783203125, -85.1748046875, -82.56640625, -79.9580078125, -77.349609375, -74.7412109375, -72.1328125, -69.5244140625, -66.916015625, -64.3076171875, -61.69921875, -59.0908203125, -56.482421875, -53.8740234375, -51.265625, -48.6572265625, -46.048828125, -43.4404296875, -40.83203125, -38.2236328125, -35.615234375, -33.0068359375, -30.3984375, -27.7900390625, -25.181640625, -22.5732421875, -19.96484375, -17.3564453125, -14.748046875, -12.1396484375, -9.53125, -6.9228515625, -4.314453125, -1.7060546875, 0.90234375, 3.5107421875, 6.119140625, 8.7275390625, 11.3359375, 13.9443359375, 16.552734375, 19.1611328125, 21.76953125, 24.3779296875, 26.986328125, 29.5947265625, 32.203125, 34.8115234375, 37.419921875, 40.0283203125, 42.63671875, 45.2451171875, 47.853515625, 50.4619140625, 53.0703125, 55.6787109375, 58.287109375, 60.8955078125, 63.50390625, 66.1123046875, 68.720703125, 71.3291015625, 73.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [6.0, 4.0, 4.0, 5.0, 1.0, 6.0, 12.0, 16.0, 28.0, 31.0, 38.0, 58.0, 82.0, 120.0, 173.0, 260.0, 403.0, 604.0, 816.0, 1255.0, 1846.0, 2711.0, 4182.0, 6623.0, 10072.0, 15696.0, 24913.0, 39863.0, 63703.0, 104523.0, 167050.0, 211371.0, 147841.0, 90886.0, 56324.0, 34853.0, 22104.0, 14053.0, 8968.0, 5694.0, 3752.0, 2427.0, 1642.0, 1098.0, 739.0, 548.0, 323.0, 269.0, 186.0, 138.0, 73.0, 60.0, 35.0, 29.0, 18.0, 14.0, 10.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-129.375, -125.25, -121.125, -117.0, -112.875, -108.75, -104.625, -100.5, -96.375, -92.25, -88.125, -84.0, -79.875, -75.75, -71.625, -67.5, -63.375, -59.25, -55.125, -51.0, -46.875, -42.75, -38.625, -34.5, -30.375, -26.25, -22.125, -18.0, -13.875, -9.75, -5.625, -1.5, 2.625, 6.75, 10.875, 15.0, 19.125, 23.25, 27.375, 31.5, 35.625, 39.75, 43.875, 48.0, 52.125, 56.25, 60.375, 64.5, 68.625, 72.75, 76.875, 81.0, 85.125, 89.25, 93.375, 97.5, 101.625, 105.75, 109.875, 114.0, 118.125, 122.25, 126.375, 130.5, 134.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 4.0, 4.0, 12.0, 9.0, 13.0, 10.0, 11.0, 12.0, 21.0, 18.0, 27.0, 22.0, 30.0, 24.0, 21.0, 35.0, 31.0, 37.0, 57.0, 33.0, 42.0, 56.0, 51.0, 41.0, 28.0, 36.0, 38.0, 43.0, 30.0, 22.0, 34.0, 19.0, 22.0, 18.0, 17.0, 11.0, 13.0, 9.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.625, -44.099609375, -42.57421875, -41.048828125, -39.5234375, -37.998046875, -36.47265625, -34.947265625, -33.421875, -31.896484375, -30.37109375, -28.845703125, -27.3203125, -25.794921875, -24.26953125, -22.744140625, -21.21875, -19.693359375, -18.16796875, -16.642578125, -15.1171875, -13.591796875, -12.06640625, -10.541015625, -9.015625, -7.490234375, -5.96484375, -4.439453125, -2.9140625, -1.388671875, 0.13671875, 1.662109375, 3.1875, 4.712890625, 6.23828125, 7.763671875, 9.2890625, 10.814453125, 12.33984375, 13.865234375, 15.390625, 16.916015625, 18.44140625, 19.966796875, 21.4921875, 23.017578125, 24.54296875, 26.068359375, 27.59375, 29.119140625, 30.64453125, 32.169921875, 33.6953125, 35.220703125, 36.74609375, 38.271484375, 39.796875, 41.322265625, 42.84765625, 44.373046875, 45.8984375, 47.423828125, 48.94921875, 50.474609375, 52.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 8.0, 21.0, 31.0, 36.0, 54.0, 85.0, 103.0, 169.0, 268.0, 396.0, 570.0, 924.0, 1300.0, 1935.0, 2953.0, 4609.0, 7268.0, 11211.0, 18543.0, 31490.0, 56343.0, 112241.0, 248774.0, 274061.0, 125109.0, 61803.0, 33886.0, 20235.0, 11931.0, 7785.0, 4947.0, 3153.0, 2072.0, 1416.0, 915.0, 616.0, 412.0, 300.0, 176.0, 144.0, 93.0, 62.0, 32.0, 26.0, 13.0, 6.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-34.6875, -33.66943359375, -32.6513671875, -31.63330078125, -30.615234375, -29.59716796875, -28.5791015625, -27.56103515625, -26.54296875, -25.52490234375, -24.5068359375, -23.48876953125, -22.470703125, -21.45263671875, -20.4345703125, -19.41650390625, -18.3984375, -17.38037109375, -16.3623046875, -15.34423828125, -14.326171875, -13.30810546875, -12.2900390625, -11.27197265625, -10.25390625, -9.23583984375, -8.2177734375, -7.19970703125, -6.181640625, -5.16357421875, -4.1455078125, -3.12744140625, -2.109375, -1.09130859375, -0.0732421875, 0.94482421875, 1.962890625, 2.98095703125, 3.9990234375, 5.01708984375, 6.03515625, 7.05322265625, 8.0712890625, 9.08935546875, 10.107421875, 11.12548828125, 12.1435546875, 13.16162109375, 14.1796875, 15.19775390625, 16.2158203125, 17.23388671875, 18.251953125, 19.27001953125, 20.2880859375, 21.30615234375, 22.32421875, 23.34228515625, 24.3603515625, 25.37841796875, 26.396484375, 27.41455078125, 28.4326171875, 29.45068359375, 30.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 10.0, 9.0, 30.0, 32.0, 28.0, 68.0, 75.0, 114.0, 170.0, 127.0, 82.0, 69.0, 51.0, 36.0, 17.0, 17.0, 12.0, 4.0, 8.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00492095947265625, -0.0047539472579956055, -0.004586935043334961, -0.004419922828674316, -0.004252910614013672, -0.004085898399353027, -0.003918886184692383, -0.0037518739700317383, -0.0035848617553710938, -0.0034178495407104492, -0.0032508373260498047, -0.00308382511138916, -0.0029168128967285156, -0.002749800682067871, -0.0025827884674072266, -0.002415776252746582, -0.0022487640380859375, -0.002081751823425293, -0.0019147396087646484, -0.001747727394104004, -0.0015807151794433594, -0.0014137029647827148, -0.0012466907501220703, -0.0010796785354614258, -0.0009126663208007812, -0.0007456541061401367, -0.0005786418914794922, -0.00041162967681884766, -0.0002446174621582031, -7.76052474975586e-05, 8.940696716308594e-05, 0.00025641918182373047, 0.000423431396484375, 0.0005904436111450195, 0.0007574558258056641, 0.0009244680404663086, 0.0010914802551269531, 0.0012584924697875977, 0.0014255046844482422, 0.0015925168991088867, 0.0017595291137695312, 0.0019265413284301758, 0.0020935535430908203, 0.002260565757751465, 0.0024275779724121094, 0.002594590187072754, 0.0027616024017333984, 0.002928614616394043, 0.0030956268310546875, 0.003262639045715332, 0.0034296512603759766, 0.003596663475036621, 0.0037636756896972656, 0.00393068790435791, 0.004097700119018555, 0.004264712333679199, 0.004431724548339844, 0.004598736763000488, 0.004765748977661133, 0.004932761192321777, 0.005099773406982422, 0.005266785621643066, 0.005433797836303711, 0.0056008100509643555, 0.005767822265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 10.0, 13.0, 24.0, 26.0, 55.0, 53.0, 79.0, 145.0, 190.0, 284.0, 373.0, 503.0, 686.0, 1005.0, 1281.0, 1882.0, 2659.0, 3780.0, 5578.0, 8129.0, 12536.0, 19250.0, 30144.0, 50059.0, 89445.0, 168913.0, 255632.0, 168325.0, 89393.0, 49738.0, 30067.0, 19065.0, 12491.0, 8205.0, 5482.0, 3802.0, 2599.0, 1838.0, 1351.0, 896.0, 697.0, 541.0, 409.0, 285.0, 199.0, 134.0, 108.0, 58.0, 40.0, 39.0, 26.0, 11.0, 10.0, 4.0, 4.0, 2.0, 3.0, 3.0], "bins": [-25.578125, -24.791015625, -24.00390625, -23.216796875, -22.4296875, -21.642578125, -20.85546875, -20.068359375, -19.28125, -18.494140625, -17.70703125, -16.919921875, -16.1328125, -15.345703125, -14.55859375, -13.771484375, -12.984375, -12.197265625, -11.41015625, -10.623046875, -9.8359375, -9.048828125, -8.26171875, -7.474609375, -6.6875, -5.900390625, -5.11328125, -4.326171875, -3.5390625, -2.751953125, -1.96484375, -1.177734375, -0.390625, 0.396484375, 1.18359375, 1.970703125, 2.7578125, 3.544921875, 4.33203125, 5.119140625, 5.90625, 6.693359375, 7.48046875, 8.267578125, 9.0546875, 9.841796875, 10.62890625, 11.416015625, 12.203125, 12.990234375, 13.77734375, 14.564453125, 15.3515625, 16.138671875, 16.92578125, 17.712890625, 18.5, 19.287109375, 20.07421875, 20.861328125, 21.6484375, 22.435546875, 23.22265625, 24.009765625, 24.796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 10.0, 11.0, 5.0, 5.0, 14.0, 13.0, 15.0, 15.0, 28.0, 25.0, 36.0, 30.0, 41.0, 41.0, 49.0, 61.0, 74.0, 63.0, 67.0, 51.0, 67.0, 41.0, 30.0, 23.0, 30.0, 25.0, 25.0, 16.0, 16.0, 20.0, 5.0, 9.0, 3.0, 3.0, 7.0, 4.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.96875, -9.677490234375, -9.38623046875, -9.094970703125, -8.8037109375, -8.512451171875, -8.22119140625, -7.929931640625, -7.638671875, -7.347412109375, -7.05615234375, -6.764892578125, -6.4736328125, -6.182373046875, -5.89111328125, -5.599853515625, -5.30859375, -5.017333984375, -4.72607421875, -4.434814453125, -4.1435546875, -3.852294921875, -3.56103515625, -3.269775390625, -2.978515625, -2.687255859375, -2.39599609375, -2.104736328125, -1.8134765625, -1.522216796875, -1.23095703125, -0.939697265625, -0.6484375, -0.357177734375, -0.06591796875, 0.225341796875, 0.5166015625, 0.807861328125, 1.09912109375, 1.390380859375, 1.681640625, 1.972900390625, 2.26416015625, 2.555419921875, 2.8466796875, 3.137939453125, 3.42919921875, 3.720458984375, 4.01171875, 4.302978515625, 4.59423828125, 4.885498046875, 5.1767578125, 5.468017578125, 5.75927734375, 6.050537109375, 6.341796875, 6.633056640625, 6.92431640625, 7.215576171875, 7.5068359375, 7.798095703125, 8.08935546875, 8.380615234375, 8.671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 17.0, 14.0, 20.0, 25.0, 27.0, 37.0, 40.0, 40.0, 65.0, 77.0, 86.0, 73.0, 80.0, 78.0, 72.0, 46.0, 32.0, 43.0, 30.0, 16.0, 11.0, 12.0, 11.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-133.5307159423828, -129.7549285888672, -125.9791488647461, -122.20336151123047, -118.42757415771484, -114.65179443359375, -110.87600708007812, -107.1002197265625, -103.32443237304688, -99.54864501953125, -95.77286529541016, -91.99707794189453, -88.2212905883789, -84.44551086425781, -80.66972351074219, -76.89393615722656, -73.11815643310547, -69.34236907958984, -65.56658935546875, -61.790802001953125, -58.0150146484375, -54.23923110961914, -50.46344757080078, -46.687660217285156, -42.9118766784668, -39.13609313964844, -35.36030578613281, -31.584522247314453, -27.80873680114746, -24.03295135498047, -20.25716781616211, -16.481382369995117, -12.705589294433594, -8.929803848266602, -5.154019355773926, -1.37823486328125, 2.397550582885742, 6.173336029052734, 9.949119567871094, 13.724905014038086, 17.500690460205078, 21.27647590637207, 25.052261352539062, 28.828044891357422, 32.60382843017578, 36.379615783691406, 40.155399322509766, 43.931182861328125, 47.70697021484375, 51.48275375366211, 55.258541107177734, 59.034324645996094, 62.81011199951172, 66.58589172363281, 70.36167907714844, 74.13746643066406, 77.91325378417969, 81.68904113769531, 85.4648208618164, 89.24060821533203, 93.01639556884766, 96.79217529296875, 100.56796264648438, 104.34375, 108.1195297241211]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 14.0, 8.0, 10.0, 11.0, 18.0, 24.0, 15.0, 20.0, 22.0, 27.0, 35.0, 36.0, 34.0, 40.0, 58.0, 35.0, 50.0, 37.0, 34.0, 32.0, 52.0, 38.0, 48.0, 31.0, 25.0, 35.0, 28.0, 32.0, 17.0, 17.0, 17.0, 14.0, 10.0, 16.0, 10.0, 10.0, 6.0, 4.0, 5.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-87.68623352050781, -85.16998291015625, -82.65373992919922, -80.13748931884766, -77.62124633789062, -75.10499572753906, -72.58875274658203, -70.07250213623047, -67.55625915527344, -65.04000854492188, -62.523765563964844, -60.00751876831055, -57.49127197265625, -54.97502136230469, -52.45877456665039, -49.942527770996094, -47.42627716064453, -44.910030364990234, -42.39378356933594, -39.87753677368164, -37.361289978027344, -34.84503936767578, -32.328792572021484, -29.812545776367188, -27.29629898071289, -24.780052185058594, -22.263805389404297, -19.747556686401367, -17.23130989074707, -14.715063095092773, -12.19881534576416, -9.682567596435547, -7.166313171386719, -4.650065898895264, -2.1338186264038086, 0.3824286460876465, 2.8986759185791016, 5.414922714233398, 7.931170463562012, 10.447418212890625, 12.963665008544922, 15.479911804199219, 17.996158599853516, 20.512407302856445, 23.028654098510742, 25.54490089416504, 28.06114959716797, 30.577396392822266, 33.09364318847656, 35.60988998413086, 38.126136779785156, 40.64238357543945, 43.15863037109375, 45.67488098144531, 48.19112777709961, 50.707374572753906, 53.2236213684082, 55.7398681640625, 58.2561149597168, 60.772361755371094, 63.288612365722656, 65.80485534667969, 68.32110595703125, 70.83735656738281, 73.35359954833984]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 11.0, 19.0, 14.0, 29.0, 32.0, 55.0, 74.0, 103.0, 119.0, 210.0, 282.0, 412.0, 556.0, 895.0, 1187.0, 1883.0, 2776.0, 4309.0, 6704.0, 10315.0, 17003.0, 28306.0, 48684.0, 88053.0, 187379.0, 630551.0, 1835347.0, 857478.0, 225933.0, 101559.0, 55886.0, 32868.0, 19804.0, 12638.0, 8068.0, 5071.0, 3309.0, 2185.0, 1377.0, 940.0, 616.0, 411.0, 274.0, 193.0, 130.0, 78.0, 56.0, 38.0, 23.0, 8.0, 7.0, 13.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0], "bins": [-133.75, -129.6484375, -125.546875, -121.4453125, -117.34375, -113.2421875, -109.140625, -105.0390625, -100.9375, -96.8359375, -92.734375, -88.6328125, -84.53125, -80.4296875, -76.328125, -72.2265625, -68.125, -64.0234375, -59.921875, -55.8203125, -51.71875, -47.6171875, -43.515625, -39.4140625, -35.3125, -31.2109375, -27.109375, -23.0078125, -18.90625, -14.8046875, -10.703125, -6.6015625, -2.5, 1.6015625, 5.703125, 9.8046875, 13.90625, 18.0078125, 22.109375, 26.2109375, 30.3125, 34.4140625, 38.515625, 42.6171875, 46.71875, 50.8203125, 54.921875, 59.0234375, 63.125, 67.2265625, 71.328125, 75.4296875, 79.53125, 83.6328125, 87.734375, 91.8359375, 95.9375, 100.0390625, 104.140625, 108.2421875, 112.34375, 116.4453125, 120.546875, 124.6484375, 128.75]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 9.0, 14.0, 11.0, 11.0, 20.0, 20.0, 22.0, 17.0, 32.0, 26.0, 26.0, 38.0, 52.0, 47.0, 46.0, 47.0, 42.0, 46.0, 32.0, 48.0, 42.0, 36.0, 39.0, 33.0, 37.0, 30.0, 24.0, 31.0, 16.0, 16.0, 18.0, 15.0, 9.0, 12.0, 9.0, 2.0, 3.0, 5.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-72.25, -70.15234375, -68.0546875, -65.95703125, -63.859375, -61.76171875, -59.6640625, -57.56640625, -55.46875, -53.37109375, -51.2734375, -49.17578125, -47.078125, -44.98046875, -42.8828125, -40.78515625, -38.6875, -36.58984375, -34.4921875, -32.39453125, -30.296875, -28.19921875, -26.1015625, -24.00390625, -21.90625, -19.80859375, -17.7109375, -15.61328125, -13.515625, -11.41796875, -9.3203125, -7.22265625, -5.125, -3.02734375, -0.9296875, 1.16796875, 3.265625, 5.36328125, 7.4609375, 9.55859375, 11.65625, 13.75390625, 15.8515625, 17.94921875, 20.046875, 22.14453125, 24.2421875, 26.33984375, 28.4375, 30.53515625, 32.6328125, 34.73046875, 36.828125, 38.92578125, 41.0234375, 43.12109375, 45.21875, 47.31640625, 49.4140625, 51.51171875, 53.609375, 55.70703125, 57.8046875, 59.90234375, 62.0]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 19.0, 17.0, 40.0, 50.0, 89.0, 114.0, 193.0, 280.0, 424.0, 602.0, 905.0, 1415.0, 2100.0, 3419.0, 5309.0, 8701.0, 13909.0, 23288.0, 40078.0, 72269.0, 138113.0, 291672.0, 795463.0, 1711127.0, 583313.0, 235998.0, 115113.0, 61729.0, 34852.0, 20393.0, 12335.0, 7590.0, 4657.0, 3061.0, 1885.0, 1269.0, 812.0, 571.0, 349.0, 246.0, 159.0, 101.0, 82.0, 44.0, 29.0, 29.0, 19.0, 10.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-115.5, -111.931640625, -108.36328125, -104.794921875, -101.2265625, -97.658203125, -94.08984375, -90.521484375, -86.953125, -83.384765625, -79.81640625, -76.248046875, -72.6796875, -69.111328125, -65.54296875, -61.974609375, -58.40625, -54.837890625, -51.26953125, -47.701171875, -44.1328125, -40.564453125, -36.99609375, -33.427734375, -29.859375, -26.291015625, -22.72265625, -19.154296875, -15.5859375, -12.017578125, -8.44921875, -4.880859375, -1.3125, 2.255859375, 5.82421875, 9.392578125, 12.9609375, 16.529296875, 20.09765625, 23.666015625, 27.234375, 30.802734375, 34.37109375, 37.939453125, 41.5078125, 45.076171875, 48.64453125, 52.212890625, 55.78125, 59.349609375, 62.91796875, 66.486328125, 70.0546875, 73.623046875, 77.19140625, 80.759765625, 84.328125, 87.896484375, 91.46484375, 95.033203125, 98.6015625, 102.169921875, 105.73828125, 109.306640625, 112.875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 6.0, 10.0, 9.0, 14.0, 20.0, 19.0, 21.0, 30.0, 34.0, 35.0, 45.0, 62.0, 86.0, 87.0, 117.0, 158.0, 162.0, 239.0, 259.0, 396.0, 427.0, 376.0, 284.0, 231.0, 190.0, 127.0, 121.0, 113.0, 83.0, 68.0, 47.0, 36.0, 32.0, 23.0, 27.0, 12.0, 11.0, 9.0, 8.0, 16.0, 11.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.53125, -34.4033203125, -33.275390625, -32.1474609375, -31.01953125, -29.8916015625, -28.763671875, -27.6357421875, -26.5078125, -25.3798828125, -24.251953125, -23.1240234375, -21.99609375, -20.8681640625, -19.740234375, -18.6123046875, -17.484375, -16.3564453125, -15.228515625, -14.1005859375, -12.97265625, -11.8447265625, -10.716796875, -9.5888671875, -8.4609375, -7.3330078125, -6.205078125, -5.0771484375, -3.94921875, -2.8212890625, -1.693359375, -0.5654296875, 0.5625, 1.6904296875, 2.818359375, 3.9462890625, 5.07421875, 6.2021484375, 7.330078125, 8.4580078125, 9.5859375, 10.7138671875, 11.841796875, 12.9697265625, 14.09765625, 15.2255859375, 16.353515625, 17.4814453125, 18.609375, 19.7373046875, 20.865234375, 21.9931640625, 23.12109375, 24.2490234375, 25.376953125, 26.5048828125, 27.6328125, 28.7607421875, 29.888671875, 31.0166015625, 32.14453125, 33.2724609375, 34.400390625, 35.5283203125, 36.65625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 7.0, 5.0, 20.0, 24.0, 27.0, 39.0, 28.0, 41.0, 41.0, 66.0, 80.0, 75.0, 93.0, 101.0, 62.0, 61.0, 46.0, 34.0, 31.0, 28.0, 20.0, 13.0, 13.0, 9.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-138.45950317382812, -134.84710693359375, -131.2346954345703, -127.6222915649414, -124.0098876953125, -120.3974838256836, -116.78507995605469, -113.17267608642578, -109.56027221679688, -105.94786834716797, -102.33546447753906, -98.72306060791016, -95.11065673828125, -91.49825286865234, -87.88584899902344, -84.27344512939453, -80.66104125976562, -77.04863739013672, -73.43623352050781, -69.8238296508789, -66.21142578125, -62.599021911621094, -58.98661804199219, -55.37421417236328, -51.761810302734375, -48.14940643310547, -44.53700256347656, -40.924598693847656, -37.31219482421875, -33.699790954589844, -30.087387084960938, -26.47498321533203, -22.862579345703125, -19.25017547607422, -15.637771606445312, -12.025367736816406, -8.4129638671875, -4.800559997558594, -1.1881561279296875, 2.4242477416992188, 6.036651611328125, 9.649055480957031, 13.261459350585938, 16.873863220214844, 20.48626708984375, 24.098670959472656, 27.711074829101562, 31.32347869873047, 34.935882568359375, 38.54828643798828, 42.16069030761719, 45.773094177246094, 49.385498046875, 52.997901916503906, 56.61030578613281, 60.22270965576172, 63.835113525390625, 67.44751739501953, 71.05992126464844, 74.67232513427734, 78.28472900390625, 81.89713287353516, 85.50953674316406, 89.12194061279297, 92.73434448242188]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 8.0, 10.0, 8.0, 7.0, 14.0, 22.0, 21.0, 29.0, 28.0, 23.0, 28.0, 37.0, 30.0, 36.0, 54.0, 43.0, 43.0, 52.0, 48.0, 48.0, 43.0, 36.0, 32.0, 33.0, 30.0, 32.0, 32.0, 30.0, 15.0, 16.0, 16.0, 15.0, 13.0, 11.0, 10.0, 7.0, 4.0, 3.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.64378356933594, -71.24819946289062, -68.85261535644531, -66.45703887939453, -64.06145477294922, -61.665870666503906, -59.270286560058594, -56.87470245361328, -54.479122161865234, -52.08353805541992, -49.687957763671875, -47.29237365722656, -44.89678955078125, -42.5012092590332, -40.10562515258789, -37.710044860839844, -35.31446075439453, -32.91887664794922, -30.523296356201172, -28.12771224975586, -25.73213005065918, -23.3365478515625, -20.940963745117188, -18.545381546020508, -16.149799346923828, -13.754217147827148, -11.358633995056152, -8.963050842285156, -6.567468643188477, -4.171886444091797, -1.7763032913208008, 0.6192798614501953, 3.0148544311523438, 5.410437107086182, 7.8060197830200195, 10.201602935791016, 12.597185134887695, 14.992767333984375, 17.388351440429688, 19.783933639526367, 22.179515838623047, 24.575098037719727, 26.970680236816406, 29.36626434326172, 31.7618465423584, 34.15742874145508, 36.55301284790039, 38.94859313964844, 41.34417724609375, 43.73976135253906, 46.13534164428711, 48.53092575073242, 50.92650604248047, 53.32209014892578, 55.717674255371094, 58.113258361816406, 60.50883865356445, 62.904422760009766, 65.30000305175781, 67.69558715820312, 70.09117126464844, 72.48675537109375, 74.88233184814453, 77.27791595458984, 79.67350006103516]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 14.0, 21.0, 33.0, 41.0, 58.0, 69.0, 122.0, 198.0, 276.0, 397.0, 624.0, 912.0, 1322.0, 1827.0, 2915.0, 4343.0, 6503.0, 9940.0, 15338.0, 23651.0, 36824.0, 58933.0, 93955.0, 150048.0, 202967.0, 160531.0, 101126.0, 62567.0, 39714.0, 25510.0, 16402.0, 10563.0, 6899.0, 4569.0, 3042.0, 2045.0, 1306.0, 932.0, 638.0, 464.0, 291.0, 180.0, 142.0, 113.0, 68.0, 33.0, 22.0, 22.0, 19.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-97.5625, -94.47265625, -91.3828125, -88.29296875, -85.203125, -82.11328125, -79.0234375, -75.93359375, -72.84375, -69.75390625, -66.6640625, -63.57421875, -60.484375, -57.39453125, -54.3046875, -51.21484375, -48.125, -45.03515625, -41.9453125, -38.85546875, -35.765625, -32.67578125, -29.5859375, -26.49609375, -23.40625, -20.31640625, -17.2265625, -14.13671875, -11.046875, -7.95703125, -4.8671875, -1.77734375, 1.3125, 4.40234375, 7.4921875, 10.58203125, 13.671875, 16.76171875, 19.8515625, 22.94140625, 26.03125, 29.12109375, 32.2109375, 35.30078125, 38.390625, 41.48046875, 44.5703125, 47.66015625, 50.75, 53.83984375, 56.9296875, 60.01953125, 63.109375, 66.19921875, 69.2890625, 72.37890625, 75.46875, 78.55859375, 81.6484375, 84.73828125, 87.828125, 90.91796875, 94.0078125, 97.09765625, 100.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 1.0, 6.0, 7.0, 8.0, 11.0, 15.0, 14.0, 19.0, 31.0, 25.0, 28.0, 35.0, 26.0, 36.0, 49.0, 52.0, 34.0, 49.0, 52.0, 57.0, 56.0, 36.0, 37.0, 28.0, 43.0, 32.0, 34.0, 33.0, 25.0, 17.0, 17.0, 13.0, 13.0, 11.0, 10.0, 11.0, 2.0, 4.0, 3.0, 6.0, 4.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.5625, -62.53515625, -60.5078125, -58.48046875, -56.453125, -54.42578125, -52.3984375, -50.37109375, -48.34375, -46.31640625, -44.2890625, -42.26171875, -40.234375, -38.20703125, -36.1796875, -34.15234375, -32.125, -30.09765625, -28.0703125, -26.04296875, -24.015625, -21.98828125, -19.9609375, -17.93359375, -15.90625, -13.87890625, -11.8515625, -9.82421875, -7.796875, -5.76953125, -3.7421875, -1.71484375, 0.3125, 2.33984375, 4.3671875, 6.39453125, 8.421875, 10.44921875, 12.4765625, 14.50390625, 16.53125, 18.55859375, 20.5859375, 22.61328125, 24.640625, 26.66796875, 28.6953125, 30.72265625, 32.75, 34.77734375, 36.8046875, 38.83203125, 40.859375, 42.88671875, 44.9140625, 46.94140625, 48.96875, 50.99609375, 53.0234375, 55.05078125, 57.078125, 59.10546875, 61.1328125, 63.16015625, 65.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 6.0, 15.0, 14.0, 26.0, 29.0, 51.0, 71.0, 89.0, 134.0, 204.0, 268.0, 452.0, 605.0, 999.0, 1445.0, 2177.0, 3375.0, 5440.0, 8817.0, 14969.0, 26013.0, 47212.0, 91576.0, 193380.0, 301798.0, 167041.0, 80722.0, 42159.0, 23484.0, 13572.0, 8147.0, 4956.0, 3176.0, 2060.0, 1354.0, 881.0, 593.0, 375.0, 281.0, 208.0, 131.0, 84.0, 70.0, 40.0, 21.0, 16.0, 11.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-169.5, -164.26953125, -159.0390625, -153.80859375, -148.578125, -143.34765625, -138.1171875, -132.88671875, -127.65625, -122.42578125, -117.1953125, -111.96484375, -106.734375, -101.50390625, -96.2734375, -91.04296875, -85.8125, -80.58203125, -75.3515625, -70.12109375, -64.890625, -59.66015625, -54.4296875, -49.19921875, -43.96875, -38.73828125, -33.5078125, -28.27734375, -23.046875, -17.81640625, -12.5859375, -7.35546875, -2.125, 3.10546875, 8.3359375, 13.56640625, 18.796875, 24.02734375, 29.2578125, 34.48828125, 39.71875, 44.94921875, 50.1796875, 55.41015625, 60.640625, 65.87109375, 71.1015625, 76.33203125, 81.5625, 86.79296875, 92.0234375, 97.25390625, 102.484375, 107.71484375, 112.9453125, 118.17578125, 123.40625, 128.63671875, 133.8671875, 139.09765625, 144.328125, 149.55859375, 154.7890625, 160.01953125, 165.25]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 10.0, 7.0, 8.0, 14.0, 14.0, 14.0, 25.0, 21.0, 16.0, 27.0, 38.0, 37.0, 28.0, 42.0, 46.0, 37.0, 41.0, 45.0, 43.0, 33.0, 51.0, 34.0, 37.0, 35.0, 34.0, 43.0, 24.0, 22.0, 25.0, 23.0, 13.0, 15.0, 16.0, 12.0, 9.0, 6.0, 8.0, 5.0, 10.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-56.5625, -54.79833984375, -53.0341796875, -51.27001953125, -49.505859375, -47.74169921875, -45.9775390625, -44.21337890625, -42.44921875, -40.68505859375, -38.9208984375, -37.15673828125, -35.392578125, -33.62841796875, -31.8642578125, -30.10009765625, -28.3359375, -26.57177734375, -24.8076171875, -23.04345703125, -21.279296875, -19.51513671875, -17.7509765625, -15.98681640625, -14.22265625, -12.45849609375, -10.6943359375, -8.93017578125, -7.166015625, -5.40185546875, -3.6376953125, -1.87353515625, -0.109375, 1.65478515625, 3.4189453125, 5.18310546875, 6.947265625, 8.71142578125, 10.4755859375, 12.23974609375, 14.00390625, 15.76806640625, 17.5322265625, 19.29638671875, 21.060546875, 22.82470703125, 24.5888671875, 26.35302734375, 28.1171875, 29.88134765625, 31.6455078125, 33.40966796875, 35.173828125, 36.93798828125, 38.7021484375, 40.46630859375, 42.23046875, 43.99462890625, 45.7587890625, 47.52294921875, 49.287109375, 51.05126953125, 52.8154296875, 54.57958984375, 56.34375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 7.0, 19.0, 22.0, 36.0, 50.0, 72.0, 108.0, 169.0, 198.0, 375.0, 600.0, 883.0, 1375.0, 2328.0, 3837.0, 6596.0, 12337.0, 26910.0, 79133.0, 524016.0, 285298.0, 57454.0, 21479.0, 10566.0, 5634.0, 3358.0, 2069.0, 1290.0, 849.0, 532.0, 327.0, 205.0, 138.0, 82.0, 72.0, 48.0, 25.0, 16.0, 7.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-88.6875, -86.0693359375, -83.451171875, -80.8330078125, -78.21484375, -75.5966796875, -72.978515625, -70.3603515625, -67.7421875, -65.1240234375, -62.505859375, -59.8876953125, -57.26953125, -54.6513671875, -52.033203125, -49.4150390625, -46.796875, -44.1787109375, -41.560546875, -38.9423828125, -36.32421875, -33.7060546875, -31.087890625, -28.4697265625, -25.8515625, -23.2333984375, -20.615234375, -17.9970703125, -15.37890625, -12.7607421875, -10.142578125, -7.5244140625, -4.90625, -2.2880859375, 0.330078125, 2.9482421875, 5.56640625, 8.1845703125, 10.802734375, 13.4208984375, 16.0390625, 18.6572265625, 21.275390625, 23.8935546875, 26.51171875, 29.1298828125, 31.748046875, 34.3662109375, 36.984375, 39.6025390625, 42.220703125, 44.8388671875, 47.45703125, 50.0751953125, 52.693359375, 55.3115234375, 57.9296875, 60.5478515625, 63.166015625, 65.7841796875, 68.40234375, 71.0205078125, 73.638671875, 76.2568359375, 78.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 8.0, 19.0, 24.0, 52.0, 98.0, 225.0, 281.0, 89.0, 72.0, 40.0, 12.0, 16.0, 12.0, 6.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012359619140625, -0.011920452117919922, -0.011481285095214844, -0.011042118072509766, -0.010602951049804688, -0.01016378402709961, -0.009724617004394531, -0.009285449981689453, -0.008846282958984375, -0.008407115936279297, -0.007967948913574219, -0.007528781890869141, -0.0070896148681640625, -0.006650447845458984, -0.006211280822753906, -0.005772113800048828, -0.00533294677734375, -0.004893779754638672, -0.004454612731933594, -0.004015445709228516, -0.0035762786865234375, -0.0031371116638183594, -0.0026979446411132812, -0.002258777618408203, -0.001819610595703125, -0.0013804435729980469, -0.0009412765502929688, -0.0005021095275878906, -6.29425048828125e-05, 0.0003762245178222656, 0.0008153915405273438, 0.0012545585632324219, 0.0016937255859375, 0.002132892608642578, 0.0025720596313476562, 0.0030112266540527344, 0.0034503936767578125, 0.0038895606994628906, 0.004328727722167969, 0.004767894744873047, 0.005207061767578125, 0.005646228790283203, 0.006085395812988281, 0.006524562835693359, 0.0069637298583984375, 0.007402896881103516, 0.007842063903808594, 0.008281230926513672, 0.00872039794921875, 0.009159564971923828, 0.009598731994628906, 0.010037899017333984, 0.010477066040039062, 0.01091623306274414, 0.011355400085449219, 0.011794567108154297, 0.012233734130859375, 0.012672901153564453, 0.013112068176269531, 0.01355123519897461, 0.013990402221679688, 0.014429569244384766, 0.014868736267089844, 0.015307903289794922, 0.0157470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 13.0, 11.0, 18.0, 18.0, 37.0, 50.0, 56.0, 118.0, 166.0, 231.0, 381.0, 534.0, 854.0, 1202.0, 1742.0, 2720.0, 4026.0, 5883.0, 9786.0, 17114.0, 32652.0, 81597.0, 320462.0, 393386.0, 92535.0, 35811.0, 17655.0, 10295.0, 6364.0, 4159.0, 2898.0, 1953.0, 1228.0, 845.0, 603.0, 377.0, 224.0, 169.0, 115.0, 84.0, 53.0, 33.0, 31.0, 19.0, 17.0, 6.0, 5.0, 2.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-73.6875, -71.388671875, -69.08984375, -66.791015625, -64.4921875, -62.193359375, -59.89453125, -57.595703125, -55.296875, -52.998046875, -50.69921875, -48.400390625, -46.1015625, -43.802734375, -41.50390625, -39.205078125, -36.90625, -34.607421875, -32.30859375, -30.009765625, -27.7109375, -25.412109375, -23.11328125, -20.814453125, -18.515625, -16.216796875, -13.91796875, -11.619140625, -9.3203125, -7.021484375, -4.72265625, -2.423828125, -0.125, 2.173828125, 4.47265625, 6.771484375, 9.0703125, 11.369140625, 13.66796875, 15.966796875, 18.265625, 20.564453125, 22.86328125, 25.162109375, 27.4609375, 29.759765625, 32.05859375, 34.357421875, 36.65625, 38.955078125, 41.25390625, 43.552734375, 45.8515625, 48.150390625, 50.44921875, 52.748046875, 55.046875, 57.345703125, 59.64453125, 61.943359375, 64.2421875, 66.541015625, 68.83984375, 71.138671875, 73.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 11.0, 6.0, 8.0, 6.0, 5.0, 6.0, 13.0, 16.0, 24.0, 29.0, 28.0, 50.0, 63.0, 83.0, 123.0, 141.0, 78.0, 66.0, 46.0, 29.0, 34.0, 30.0, 21.0, 15.0, 8.0, 9.0, 7.0, 12.0, 4.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.52734375, -17.8203125, -17.11328125, -16.40625, -15.69921875, -14.9921875, -14.28515625, -13.578125, -12.87109375, -12.1640625, -11.45703125, -10.75, -10.04296875, -9.3359375, -8.62890625, -7.921875, -7.21484375, -6.5078125, -5.80078125, -5.09375, -4.38671875, -3.6796875, -2.97265625, -2.265625, -1.55859375, -0.8515625, -0.14453125, 0.5625, 1.26953125, 1.9765625, 2.68359375, 3.390625, 4.09765625, 4.8046875, 5.51171875, 6.21875, 6.92578125, 7.6328125, 8.33984375, 9.046875, 9.75390625, 10.4609375, 11.16796875, 11.875, 12.58203125, 13.2890625, 13.99609375, 14.703125, 15.41015625, 16.1171875, 16.82421875, 17.53125, 18.23828125, 18.9453125, 19.65234375, 20.359375, 21.06640625, 21.7734375, 22.48046875, 23.1875, 23.89453125, 24.6015625, 25.30859375, 26.015625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 8.0, 10.0, 13.0, 22.0, 28.0, 41.0, 52.0, 77.0, 106.0, 129.0, 123.0, 121.0, 73.0, 54.0, 46.0, 29.0, 23.0, 19.0, 14.0, 8.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.34735107421875, -130.0435333251953, -125.73973083496094, -121.4359130859375, -117.1321029663086, -112.82829284667969, -108.52448272705078, -104.22067260742188, -99.91685485839844, -95.61304473876953, -91.30923461914062, -87.00541687011719, -82.70160675048828, -78.39779663085938, -74.09398651123047, -69.79017639160156, -65.48636627197266, -61.18255615234375, -56.87874221801758, -52.57493209838867, -48.2711181640625, -43.967308044433594, -39.66349792480469, -35.35968780517578, -31.05587387084961, -26.75206184387207, -22.44824981689453, -18.144439697265625, -13.840627670288086, -9.536815643310547, -5.233005523681641, -0.9291934967041016, 3.3746185302734375, 7.678430080413818, 11.9822416305542, 16.286052703857422, 20.58986473083496, 24.8936767578125, 29.197486877441406, 33.50129699707031, 37.805110931396484, 42.10892105102539, 46.41273498535156, 50.71654510498047, 55.020355224609375, 59.32416915893555, 63.62797927856445, 67.93179321289062, 72.23560333251953, 76.53941345214844, 80.84322357177734, 85.14703369140625, 89.45085144042969, 93.7546615600586, 98.0584716796875, 102.3622817993164, 106.66609191894531, 110.96990203857422, 115.27371215820312, 119.57752990722656, 123.88134002685547, 128.18515014648438, 132.48895263671875, 136.7927703857422, 141.09658813476562]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 11.0, 0.0, 2.0, 7.0, 7.0, 10.0, 7.0, 14.0, 14.0, 12.0, 23.0, 32.0, 28.0, 33.0, 34.0, 41.0, 29.0, 42.0, 36.0, 51.0, 47.0, 51.0, 44.0, 39.0, 40.0, 42.0, 30.0, 33.0, 29.0, 30.0, 27.0, 28.0, 22.0, 17.0, 12.0, 16.0, 7.0, 8.0, 14.0, 11.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.6181526184082, -61.656272888183594, -59.694393157958984, -57.732513427734375, -55.770633697509766, -53.808753967285156, -51.84687423706055, -49.88499450683594, -47.92311477661133, -45.96123504638672, -43.99935531616211, -42.0374755859375, -40.07559585571289, -38.11371612548828, -36.15183639526367, -34.18995666503906, -32.22807693481445, -30.266197204589844, -28.304317474365234, -26.342437744140625, -24.380558013916016, -22.418678283691406, -20.456798553466797, -18.494918823242188, -16.533039093017578, -14.571159362792969, -12.60927963256836, -10.64739990234375, -8.68552017211914, -6.723640441894531, -4.761760711669922, -2.7998809814453125, -0.8380050659179688, 1.1238746643066406, 3.08575439453125, 5.047634124755859, 7.009513854980469, 8.971393585205078, 10.933273315429688, 12.895153045654297, 14.857032775878906, 16.818912506103516, 18.780792236328125, 20.742671966552734, 22.704551696777344, 24.666431427001953, 26.628311157226562, 28.590190887451172, 30.55207061767578, 32.51395034790039, 34.475830078125, 36.43770980834961, 38.39958953857422, 40.36146926879883, 42.32334899902344, 44.28522872924805, 46.247108459472656, 48.208988189697266, 50.170867919921875, 52.132747650146484, 54.094627380371094, 56.0565071105957, 58.01838684082031, 59.98026657104492, 61.94214630126953]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 12.0, 16.0, 19.0, 34.0, 46.0, 61.0, 98.0, 141.0, 229.0, 331.0, 459.0, 718.0, 1187.0, 1768.0, 2722.0, 4268.0, 6802.0, 10662.0, 17295.0, 28020.0, 46306.0, 76621.0, 127731.0, 204091.0, 201055.0, 124722.0, 74656.0, 45253.0, 27464.0, 16742.0, 10535.0, 6455.0, 4175.0, 2676.0, 1787.0, 1200.0, 748.0, 482.0, 333.0, 203.0, 138.0, 109.0, 66.0, 41.0, 27.0, 19.0, 10.0, 9.0, 7.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-75.1875, -72.974609375, -70.76171875, -68.548828125, -66.3359375, -64.123046875, -61.91015625, -59.697265625, -57.484375, -55.271484375, -53.05859375, -50.845703125, -48.6328125, -46.419921875, -44.20703125, -41.994140625, -39.78125, -37.568359375, -35.35546875, -33.142578125, -30.9296875, -28.716796875, -26.50390625, -24.291015625, -22.078125, -19.865234375, -17.65234375, -15.439453125, -13.2265625, -11.013671875, -8.80078125, -6.587890625, -4.375, -2.162109375, 0.05078125, 2.263671875, 4.4765625, 6.689453125, 8.90234375, 11.115234375, 13.328125, 15.541015625, 17.75390625, 19.966796875, 22.1796875, 24.392578125, 26.60546875, 28.818359375, 31.03125, 33.244140625, 35.45703125, 37.669921875, 39.8828125, 42.095703125, 44.30859375, 46.521484375, 48.734375, 50.947265625, 53.16015625, 55.373046875, 57.5859375, 59.798828125, 62.01171875, 64.224609375, 66.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 1.0, 4.0, 2.0, 5.0, 11.0, 6.0, 10.0, 15.0, 12.0, 26.0, 22.0, 22.0, 30.0, 31.0, 39.0, 41.0, 33.0, 35.0, 47.0, 44.0, 54.0, 45.0, 36.0, 39.0, 48.0, 31.0, 45.0, 40.0, 28.0, 30.0, 23.0, 23.0, 17.0, 20.0, 16.0, 12.0, 9.0, 4.0, 3.0, 12.0, 9.0, 1.0, 4.0, 2.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.0625, -52.27001953125, -50.4775390625, -48.68505859375, -46.892578125, -45.10009765625, -43.3076171875, -41.51513671875, -39.72265625, -37.93017578125, -36.1376953125, -34.34521484375, -32.552734375, -30.76025390625, -28.9677734375, -27.17529296875, -25.3828125, -23.59033203125, -21.7978515625, -20.00537109375, -18.212890625, -16.42041015625, -14.6279296875, -12.83544921875, -11.04296875, -9.25048828125, -7.4580078125, -5.66552734375, -3.873046875, -2.08056640625, -0.2880859375, 1.50439453125, 3.296875, 5.08935546875, 6.8818359375, 8.67431640625, 10.466796875, 12.25927734375, 14.0517578125, 15.84423828125, 17.63671875, 19.42919921875, 21.2216796875, 23.01416015625, 24.806640625, 26.59912109375, 28.3916015625, 30.18408203125, 31.9765625, 33.76904296875, 35.5615234375, 37.35400390625, 39.146484375, 40.93896484375, 42.7314453125, 44.52392578125, 46.31640625, 48.10888671875, 49.9013671875, 51.69384765625, 53.486328125, 55.27880859375, 57.0712890625, 58.86376953125, 60.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 10.0, 9.0, 21.0, 27.0, 31.0, 77.0, 86.0, 131.0, 172.0, 243.0, 413.0, 520.0, 748.0, 1167.0, 1663.0, 2524.0, 3729.0, 5382.0, 8103.0, 12290.0, 19038.0, 29361.0, 46655.0, 74970.0, 124149.0, 192016.0, 191574.0, 124685.0, 75751.0, 46728.0, 29480.0, 18988.0, 12366.0, 8323.0, 5386.0, 3740.0, 2551.0, 1738.0, 1135.0, 827.0, 543.0, 394.0, 262.0, 174.0, 109.0, 87.0, 67.0, 37.0, 33.0, 15.0, 13.0, 7.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-99.4375, -96.4248046875, -93.412109375, -90.3994140625, -87.38671875, -84.3740234375, -81.361328125, -78.3486328125, -75.3359375, -72.3232421875, -69.310546875, -66.2978515625, -63.28515625, -60.2724609375, -57.259765625, -54.2470703125, -51.234375, -48.2216796875, -45.208984375, -42.1962890625, -39.18359375, -36.1708984375, -33.158203125, -30.1455078125, -27.1328125, -24.1201171875, -21.107421875, -18.0947265625, -15.08203125, -12.0693359375, -9.056640625, -6.0439453125, -3.03125, -0.0185546875, 2.994140625, 6.0068359375, 9.01953125, 12.0322265625, 15.044921875, 18.0576171875, 21.0703125, 24.0830078125, 27.095703125, 30.1083984375, 33.12109375, 36.1337890625, 39.146484375, 42.1591796875, 45.171875, 48.1845703125, 51.197265625, 54.2099609375, 57.22265625, 60.2353515625, 63.248046875, 66.2607421875, 69.2734375, 72.2861328125, 75.298828125, 78.3115234375, 81.32421875, 84.3369140625, 87.349609375, 90.3623046875, 93.375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 10.0, 5.0, 5.0, 14.0, 16.0, 16.0, 10.0, 20.0, 25.0, 31.0, 25.0, 25.0, 27.0, 32.0, 32.0, 32.0, 38.0, 38.0, 36.0, 38.0, 37.0, 49.0, 36.0, 22.0, 34.0, 34.0, 35.0, 36.0, 31.0, 26.0, 27.0, 14.0, 18.0, 22.0, 13.0, 11.0, 13.0, 8.0, 9.0, 9.0, 5.0, 13.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-38.84375, -37.69384765625, -36.5439453125, -35.39404296875, -34.244140625, -33.09423828125, -31.9443359375, -30.79443359375, -29.64453125, -28.49462890625, -27.3447265625, -26.19482421875, -25.044921875, -23.89501953125, -22.7451171875, -21.59521484375, -20.4453125, -19.29541015625, -18.1455078125, -16.99560546875, -15.845703125, -14.69580078125, -13.5458984375, -12.39599609375, -11.24609375, -10.09619140625, -8.9462890625, -7.79638671875, -6.646484375, -5.49658203125, -4.3466796875, -3.19677734375, -2.046875, -0.89697265625, 0.2529296875, 1.40283203125, 2.552734375, 3.70263671875, 4.8525390625, 6.00244140625, 7.15234375, 8.30224609375, 9.4521484375, 10.60205078125, 11.751953125, 12.90185546875, 14.0517578125, 15.20166015625, 16.3515625, 17.50146484375, 18.6513671875, 19.80126953125, 20.951171875, 22.10107421875, 23.2509765625, 24.40087890625, 25.55078125, 26.70068359375, 27.8505859375, 29.00048828125, 30.150390625, 31.30029296875, 32.4501953125, 33.60009765625, 34.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 18.0, 9.0, 29.0, 40.0, 58.0, 83.0, 121.0, 165.0, 236.0, 385.0, 528.0, 743.0, 1138.0, 1768.0, 2636.0, 4227.0, 6845.0, 11684.0, 19872.0, 35091.0, 64425.0, 125521.0, 236923.0, 245870.0, 132498.0, 68463.0, 36765.0, 20720.0, 12067.0, 7096.0, 4336.0, 2723.0, 1754.0, 1168.0, 790.0, 518.0, 411.0, 244.0, 169.0, 143.0, 89.0, 61.0, 42.0, 29.0, 19.0, 11.0, 8.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.311279296875, -18.62255859375, -17.933837890625, -17.2451171875, -16.556396484375, -15.86767578125, -15.178955078125, -14.490234375, -13.801513671875, -13.11279296875, -12.424072265625, -11.7353515625, -11.046630859375, -10.35791015625, -9.669189453125, -8.98046875, -8.291748046875, -7.60302734375, -6.914306640625, -6.2255859375, -5.536865234375, -4.84814453125, -4.159423828125, -3.470703125, -2.781982421875, -2.09326171875, -1.404541015625, -0.7158203125, -0.027099609375, 0.66162109375, 1.350341796875, 2.0390625, 2.727783203125, 3.41650390625, 4.105224609375, 4.7939453125, 5.482666015625, 6.17138671875, 6.860107421875, 7.548828125, 8.237548828125, 8.92626953125, 9.614990234375, 10.3037109375, 10.992431640625, 11.68115234375, 12.369873046875, 13.05859375, 13.747314453125, 14.43603515625, 15.124755859375, 15.8134765625, 16.502197265625, 17.19091796875, 17.879638671875, 18.568359375, 19.257080078125, 19.94580078125, 20.634521484375, 21.3232421875, 22.011962890625, 22.70068359375, 23.389404296875, 24.078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 7.0, 5.0, 8.0, 10.0, 5.0, 18.0, 17.0, 24.0, 33.0, 38.0, 47.0, 46.0, 65.0, 83.0, 88.0, 95.0, 96.0, 81.0, 41.0, 39.0, 38.0, 21.0, 28.0, 10.0, 10.0, 11.0, 5.0, 8.0, 6.0, 5.0, 9.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002193450927734375, -0.002114593982696533, -0.0020357370376586914, -0.0019568800926208496, -0.0018780231475830078, -0.001799166202545166, -0.0017203092575073242, -0.0016414523124694824, -0.0015625953674316406, -0.0014837384223937988, -0.001404881477355957, -0.0013260245323181152, -0.0012471675872802734, -0.0011683106422424316, -0.0010894536972045898, -0.001010596752166748, -0.0009317398071289062, -0.0008528828620910645, -0.0007740259170532227, -0.0006951689720153809, -0.0006163120269775391, -0.0005374550819396973, -0.00045859813690185547, -0.00037974119186401367, -0.0003008842468261719, -0.00022202730178833008, -0.00014317035675048828, -6.431341171264648e-05, 1.4543533325195312e-05, 9.340047836303711e-05, 0.0001722574234008789, 0.0002511143684387207, 0.0003299713134765625, 0.0004088282585144043, 0.0004876852035522461, 0.0005665421485900879, 0.0006453990936279297, 0.0007242560386657715, 0.0008031129837036133, 0.0008819699287414551, 0.0009608268737792969, 0.0010396838188171387, 0.0011185407638549805, 0.0011973977088928223, 0.001276254653930664, 0.0013551115989685059, 0.0014339685440063477, 0.0015128254890441895, 0.0015916824340820312, 0.001670539379119873, 0.0017493963241577148, 0.0018282532691955566, 0.0019071102142333984, 0.0019859671592712402, 0.002064824104309082, 0.002143681049346924, 0.0022225379943847656, 0.0023013949394226074, 0.0023802518844604492, 0.002459108829498291, 0.002537965774536133, 0.0026168227195739746, 0.0026956796646118164, 0.002774536609649658, 0.0028533935546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 7.0, 13.0, 19.0, 23.0, 45.0, 47.0, 95.0, 128.0, 153.0, 258.0, 345.0, 489.0, 748.0, 1074.0, 1608.0, 2326.0, 3561.0, 5740.0, 8773.0, 13919.0, 23266.0, 40024.0, 70654.0, 125302.0, 206549.0, 217522.0, 137177.0, 77002.0, 43610.0, 25560.0, 15348.0, 9558.0, 5995.0, 3784.0, 2524.0, 1702.0, 1060.0, 820.0, 524.0, 379.0, 263.0, 162.0, 133.0, 85.0, 68.0, 39.0, 19.0, 16.0, 14.0, 5.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.34716796875, -17.7568359375, -17.16650390625, -16.576171875, -15.98583984375, -15.3955078125, -14.80517578125, -14.21484375, -13.62451171875, -13.0341796875, -12.44384765625, -11.853515625, -11.26318359375, -10.6728515625, -10.08251953125, -9.4921875, -8.90185546875, -8.3115234375, -7.72119140625, -7.130859375, -6.54052734375, -5.9501953125, -5.35986328125, -4.76953125, -4.17919921875, -3.5888671875, -2.99853515625, -2.408203125, -1.81787109375, -1.2275390625, -0.63720703125, -0.046875, 0.54345703125, 1.1337890625, 1.72412109375, 2.314453125, 2.90478515625, 3.4951171875, 4.08544921875, 4.67578125, 5.26611328125, 5.8564453125, 6.44677734375, 7.037109375, 7.62744140625, 8.2177734375, 8.80810546875, 9.3984375, 9.98876953125, 10.5791015625, 11.16943359375, 11.759765625, 12.35009765625, 12.9404296875, 13.53076171875, 14.12109375, 14.71142578125, 15.3017578125, 15.89208984375, 16.482421875, 17.07275390625, 17.6630859375, 18.25341796875, 18.84375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 9.0, 6.0, 9.0, 10.0, 12.0, 16.0, 24.0, 23.0, 33.0, 28.0, 42.0, 45.0, 56.0, 41.0, 50.0, 68.0, 63.0, 53.0, 54.0, 48.0, 35.0, 50.0, 33.0, 31.0, 17.0, 21.0, 20.0, 21.0, 15.0, 7.0, 14.0, 10.0, 3.0, 6.0, 1.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.57421875, -6.378173828125, -6.18212890625, -5.986083984375, -5.7900390625, -5.593994140625, -5.39794921875, -5.201904296875, -5.005859375, -4.809814453125, -4.61376953125, -4.417724609375, -4.2216796875, -4.025634765625, -3.82958984375, -3.633544921875, -3.4375, -3.241455078125, -3.04541015625, -2.849365234375, -2.6533203125, -2.457275390625, -2.26123046875, -2.065185546875, -1.869140625, -1.673095703125, -1.47705078125, -1.281005859375, -1.0849609375, -0.888916015625, -0.69287109375, -0.496826171875, -0.30078125, -0.104736328125, 0.09130859375, 0.287353515625, 0.4833984375, 0.679443359375, 0.87548828125, 1.071533203125, 1.267578125, 1.463623046875, 1.65966796875, 1.855712890625, 2.0517578125, 2.247802734375, 2.44384765625, 2.639892578125, 2.8359375, 3.031982421875, 3.22802734375, 3.424072265625, 3.6201171875, 3.816162109375, 4.01220703125, 4.208251953125, 4.404296875, 4.600341796875, 4.79638671875, 4.992431640625, 5.1884765625, 5.384521484375, 5.58056640625, 5.776611328125, 5.97265625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 13.0, 12.0, 22.0, 25.0, 37.0, 51.0, 60.0, 85.0, 99.0, 117.0, 96.0, 85.0, 69.0, 73.0, 42.0, 21.0, 25.0, 15.0, 13.0, 12.0, 10.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-118.57764434814453, -114.96800994873047, -111.35836791992188, -107.74873352050781, -104.13909149169922, -100.52945709228516, -96.91981506347656, -93.3101806640625, -89.7005386352539, -86.09090423583984, -82.48126220703125, -78.87162780761719, -75.2619857788086, -71.65235137939453, -68.04270935058594, -64.43307495117188, -60.82343673706055, -57.21379852294922, -53.60416030883789, -49.99452209472656, -46.384883880615234, -42.775245666503906, -39.165611267089844, -35.55596923828125, -31.946332931518555, -28.336694717407227, -24.7270565032959, -21.117420196533203, -17.507781982421875, -13.898143768310547, -10.288505554199219, -6.678867340087891, -3.0692291259765625, 0.5404088497161865, 4.1500468254089355, 7.7596845626831055, 11.369322776794434, 14.978960037231445, 18.588598251342773, 22.1982364654541, 25.80787467956543, 29.417512893676758, 33.02714920043945, 36.63678741455078, 40.24642562866211, 43.85606384277344, 47.465702056884766, 51.075340270996094, 54.68497848510742, 58.29461669921875, 61.90425491333008, 65.5138931274414, 69.12352752685547, 72.73316955566406, 76.34280395507812, 79.95244598388672, 83.56208038330078, 87.17171478271484, 90.78135681152344, 94.3909912109375, 98.0006332397461, 101.61026763916016, 105.21990966796875, 108.82954406738281, 112.4391860961914]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 0.0, 6.0, 5.0, 3.0, 6.0, 3.0, 7.0, 13.0, 9.0, 16.0, 18.0, 24.0, 15.0, 33.0, 22.0, 26.0, 39.0, 35.0, 32.0, 40.0, 34.0, 34.0, 47.0, 38.0, 48.0, 40.0, 45.0, 41.0, 30.0, 30.0, 35.0, 30.0, 27.0, 19.0, 18.0, 18.0, 19.0, 10.0, 19.0, 10.0, 9.0, 14.0, 6.0, 3.0, 6.0, 1.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-57.111000061035156, -55.35655975341797, -53.60212326049805, -51.84768295288086, -50.09324645996094, -48.33880615234375, -46.58436584472656, -44.82992935180664, -43.07549285888672, -41.32105255126953, -39.56661605834961, -37.81217575073242, -36.0577392578125, -34.30329895019531, -32.548858642578125, -30.794422149658203, -29.039981842041016, -27.28554344177246, -25.531105041503906, -23.77666473388672, -22.022228240966797, -20.26778793334961, -18.513349533081055, -16.7589111328125, -15.004472732543945, -13.25003433227539, -11.495595932006836, -9.741156578063965, -7.98671817779541, -6.2322797775268555, -4.477840423583984, -2.7234020233154297, -0.9689598083496094, 0.7854788303375244, 2.539917469024658, 4.294356346130371, 6.048794746398926, 7.8032331466674805, 9.557672500610352, 11.312110900878906, 13.066549301147461, 14.820987701416016, 16.57542610168457, 18.329864501953125, 20.084304809570312, 21.838741302490234, 23.593181610107422, 25.347620010375977, 27.10205841064453, 28.856496810913086, 30.61093521118164, 32.36537551879883, 34.11981201171875, 35.87425231933594, 37.628692626953125, 39.38312911987305, 41.13756561279297, 42.892005920410156, 44.64644241333008, 46.400882720947266, 48.15531921386719, 49.909759521484375, 51.66419982910156, 53.418636322021484, 55.17307662963867]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 16.0, 16.0, 32.0, 36.0, 49.0, 73.0, 97.0, 135.0, 211.0, 286.0, 393.0, 638.0, 900.0, 1351.0, 1990.0, 3004.0, 4795.0, 7559.0, 12518.0, 21141.0, 37572.0, 70918.0, 163143.0, 560551.0, 1619468.0, 1130163.0, 318665.0, 112459.0, 53638.0, 28960.0, 16505.0, 9773.0, 6069.0, 3795.0, 2525.0, 1560.0, 1126.0, 726.0, 471.0, 320.0, 225.0, 150.0, 92.0, 59.0, 36.0, 22.0, 14.0, 12.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-77.125, -74.6982421875, -72.271484375, -69.8447265625, -67.41796875, -64.9912109375, -62.564453125, -60.1376953125, -57.7109375, -55.2841796875, -52.857421875, -50.4306640625, -48.00390625, -45.5771484375, -43.150390625, -40.7236328125, -38.296875, -35.8701171875, -33.443359375, -31.0166015625, -28.58984375, -26.1630859375, -23.736328125, -21.3095703125, -18.8828125, -16.4560546875, -14.029296875, -11.6025390625, -9.17578125, -6.7490234375, -4.322265625, -1.8955078125, 0.53125, 2.9580078125, 5.384765625, 7.8115234375, 10.23828125, 12.6650390625, 15.091796875, 17.5185546875, 19.9453125, 22.3720703125, 24.798828125, 27.2255859375, 29.65234375, 32.0791015625, 34.505859375, 36.9326171875, 39.359375, 41.7861328125, 44.212890625, 46.6396484375, 49.06640625, 51.4931640625, 53.919921875, 56.3466796875, 58.7734375, 61.2001953125, 63.626953125, 66.0537109375, 68.48046875, 70.9072265625, 73.333984375, 75.7607421875, 78.1875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 3.0, 6.0, 5.0, 15.0, 11.0, 10.0, 13.0, 21.0, 23.0, 20.0, 39.0, 23.0, 24.0, 30.0, 47.0, 29.0, 39.0, 38.0, 51.0, 41.0, 47.0, 43.0, 32.0, 39.0, 51.0, 35.0, 32.0, 26.0, 22.0, 34.0, 19.0, 21.0, 13.0, 11.0, 14.0, 6.0, 14.0, 9.0, 8.0, 1.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-41.5625, -40.2880859375, -39.013671875, -37.7392578125, -36.46484375, -35.1904296875, -33.916015625, -32.6416015625, -31.3671875, -30.0927734375, -28.818359375, -27.5439453125, -26.26953125, -24.9951171875, -23.720703125, -22.4462890625, -21.171875, -19.8974609375, -18.623046875, -17.3486328125, -16.07421875, -14.7998046875, -13.525390625, -12.2509765625, -10.9765625, -9.7021484375, -8.427734375, -7.1533203125, -5.87890625, -4.6044921875, -3.330078125, -2.0556640625, -0.78125, 0.4931640625, 1.767578125, 3.0419921875, 4.31640625, 5.5908203125, 6.865234375, 8.1396484375, 9.4140625, 10.6884765625, 11.962890625, 13.2373046875, 14.51171875, 15.7861328125, 17.060546875, 18.3349609375, 19.609375, 20.8837890625, 22.158203125, 23.4326171875, 24.70703125, 25.9814453125, 27.255859375, 28.5302734375, 29.8046875, 31.0791015625, 32.353515625, 33.6279296875, 34.90234375, 36.1767578125, 37.451171875, 38.7255859375, 40.0]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 6.0, 22.0, 44.0, 50.0, 45.0, 112.0, 149.0, 241.0, 421.0, 634.0, 1011.0, 1682.0, 2706.0, 4563.0, 7833.0, 13554.0, 23477.0, 42373.0, 79959.0, 155866.0, 333833.0, 861504.0, 1540961.0, 601759.0, 252917.0, 122352.0, 64258.0, 35007.0, 19596.0, 11293.0, 6419.0, 3826.0, 2278.0, 1387.0, 856.0, 499.0, 306.0, 181.0, 110.0, 71.0, 35.0, 22.0, 16.0, 19.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.875, -61.6201171875, -59.365234375, -57.1103515625, -54.85546875, -52.6005859375, -50.345703125, -48.0908203125, -45.8359375, -43.5810546875, -41.326171875, -39.0712890625, -36.81640625, -34.5615234375, -32.306640625, -30.0517578125, -27.796875, -25.5419921875, -23.287109375, -21.0322265625, -18.77734375, -16.5224609375, -14.267578125, -12.0126953125, -9.7578125, -7.5029296875, -5.248046875, -2.9931640625, -0.73828125, 1.5166015625, 3.771484375, 6.0263671875, 8.28125, 10.5361328125, 12.791015625, 15.0458984375, 17.30078125, 19.5556640625, 21.810546875, 24.0654296875, 26.3203125, 28.5751953125, 30.830078125, 33.0849609375, 35.33984375, 37.5947265625, 39.849609375, 42.1044921875, 44.359375, 46.6142578125, 48.869140625, 51.1240234375, 53.37890625, 55.6337890625, 57.888671875, 60.1435546875, 62.3984375, 64.6533203125, 66.908203125, 69.1630859375, 71.41796875, 73.6728515625, 75.927734375, 78.1826171875, 80.4375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 5.0, 9.0, 8.0, 13.0, 7.0, 11.0, 22.0, 16.0, 24.0, 36.0, 33.0, 50.0, 59.0, 72.0, 109.0, 104.0, 141.0, 163.0, 200.0, 235.0, 275.0, 336.0, 389.0, 278.0, 230.0, 202.0, 163.0, 149.0, 121.0, 89.0, 78.0, 78.0, 65.0, 55.0, 44.0, 27.0, 39.0, 35.0, 16.0, 17.0, 21.0, 10.0, 10.0, 10.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-19.4375, -18.8076171875, -18.177734375, -17.5478515625, -16.91796875, -16.2880859375, -15.658203125, -15.0283203125, -14.3984375, -13.7685546875, -13.138671875, -12.5087890625, -11.87890625, -11.2490234375, -10.619140625, -9.9892578125, -9.359375, -8.7294921875, -8.099609375, -7.4697265625, -6.83984375, -6.2099609375, -5.580078125, -4.9501953125, -4.3203125, -3.6904296875, -3.060546875, -2.4306640625, -1.80078125, -1.1708984375, -0.541015625, 0.0888671875, 0.71875, 1.3486328125, 1.978515625, 2.6083984375, 3.23828125, 3.8681640625, 4.498046875, 5.1279296875, 5.7578125, 6.3876953125, 7.017578125, 7.6474609375, 8.27734375, 8.9072265625, 9.537109375, 10.1669921875, 10.796875, 11.4267578125, 12.056640625, 12.6865234375, 13.31640625, 13.9462890625, 14.576171875, 15.2060546875, 15.8359375, 16.4658203125, 17.095703125, 17.7255859375, 18.35546875, 18.9853515625, 19.615234375, 20.2451171875, 20.875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 3.0, 12.0, 9.0, 16.0, 19.0, 30.0, 33.0, 38.0, 38.0, 43.0, 50.0, 67.0, 71.0, 62.0, 75.0, 63.0, 71.0, 43.0, 52.0, 33.0, 36.0, 15.0, 20.0, 20.0, 12.0, 7.0, 8.0, 11.0, 8.0, 4.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.30702209472656, -55.384098052978516, -53.46117401123047, -51.538246154785156, -49.61532211303711, -47.69239807128906, -45.769474029541016, -43.84654998779297, -41.92362594604492, -40.000701904296875, -38.07777786254883, -36.15485382080078, -34.23192596435547, -32.30900192260742, -30.386077880859375, -28.463153839111328, -26.54022789001465, -24.6173038482666, -22.694377899169922, -20.771453857421875, -18.848529815673828, -16.92560577392578, -15.002679824829102, -13.079755783081055, -11.156830787658691, -9.233905792236328, -7.310981750488281, -5.388056755065918, -3.465132236480713, -1.5422077178955078, 0.38071727752685547, 2.3036413192749023, 4.226566314697266, 6.149490833282471, 8.072415351867676, 9.995340347290039, 11.918264389038086, 13.84118938446045, 15.764114379882812, 17.68703842163086, 19.609962463378906, 21.532886505126953, 23.455812454223633, 25.37873649597168, 27.301660537719727, 29.224586486816406, 31.147510528564453, 33.0704345703125, 34.99336242675781, 36.91628646850586, 38.839210510253906, 40.76213836669922, 42.685062408447266, 44.60798645019531, 46.53091049194336, 48.453834533691406, 50.37675857543945, 52.2996826171875, 54.22260665893555, 56.145530700683594, 58.068458557128906, 59.99138259887695, 61.914306640625, 63.83723068237305, 65.7601547241211]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 6.0, 11.0, 18.0, 18.0, 13.0, 24.0, 20.0, 24.0, 27.0, 38.0, 37.0, 36.0, 45.0, 51.0, 42.0, 38.0, 54.0, 40.0, 36.0, 42.0, 54.0, 31.0, 32.0, 38.0, 24.0, 21.0, 26.0, 25.0, 12.0, 19.0, 18.0, 10.0, 11.0, 9.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.858299255371094, -49.344215393066406, -47.830135345458984, -46.3160514831543, -44.801971435546875, -43.28788757324219, -41.7738037109375, -40.25972366333008, -38.745643615722656, -37.23155975341797, -35.71747970581055, -34.20339584350586, -32.68931579589844, -31.17523193359375, -29.661149978637695, -28.14706802368164, -26.632984161376953, -25.1189022064209, -23.604820251464844, -22.090736389160156, -20.576656341552734, -19.062572479248047, -17.548490524291992, -16.034408569335938, -14.520326614379883, -13.006244659423828, -11.492162704467773, -9.978079795837402, -8.463997840881348, -6.949915885925293, -5.435832977294922, -3.921751022338867, -2.407672882080078, -0.8935906887054443, 0.6204915046691895, 2.1345739364624023, 3.648655891418457, 5.162737846374512, 6.676820755004883, 8.190902709960938, 9.704984664916992, 11.219066619873047, 12.733148574829102, 14.247231483459473, 15.761313438415527, 17.275394439697266, 18.789478302001953, 20.303560256958008, 21.817642211914062, 23.331724166870117, 24.845806121826172, 26.35988998413086, 27.87397003173828, 29.38805389404297, 30.902135848999023, 32.41621780395508, 33.9302978515625, 35.44438171386719, 36.95846176147461, 38.4725456237793, 39.98662567138672, 41.500709533691406, 43.014793395996094, 44.528873443603516, 46.0429573059082]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 8.0, 21.0, 21.0, 23.0, 48.0, 78.0, 113.0, 189.0, 224.0, 338.0, 519.0, 790.0, 1350.0, 1957.0, 3063.0, 4528.0, 7627.0, 12342.0, 20637.0, 35370.0, 61580.0, 108851.0, 192780.0, 241600.0, 150328.0, 84377.0, 48605.0, 28015.0, 16262.0, 9853.0, 6164.0, 3791.0, 2436.0, 1561.0, 1052.0, 683.0, 475.0, 337.0, 178.0, 116.0, 94.0, 63.0, 31.0, 25.0, 18.0, 14.0, 11.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-91.875, -89.1142578125, -86.353515625, -83.5927734375, -80.83203125, -78.0712890625, -75.310546875, -72.5498046875, -69.7890625, -67.0283203125, -64.267578125, -61.5068359375, -58.74609375, -55.9853515625, -53.224609375, -50.4638671875, -47.703125, -44.9423828125, -42.181640625, -39.4208984375, -36.66015625, -33.8994140625, -31.138671875, -28.3779296875, -25.6171875, -22.8564453125, -20.095703125, -17.3349609375, -14.57421875, -11.8134765625, -9.052734375, -6.2919921875, -3.53125, -0.7705078125, 1.990234375, 4.7509765625, 7.51171875, 10.2724609375, 13.033203125, 15.7939453125, 18.5546875, 21.3154296875, 24.076171875, 26.8369140625, 29.59765625, 32.3583984375, 35.119140625, 37.8798828125, 40.640625, 43.4013671875, 46.162109375, 48.9228515625, 51.68359375, 54.4443359375, 57.205078125, 59.9658203125, 62.7265625, 65.4873046875, 68.248046875, 71.0087890625, 73.76953125, 76.5302734375, 79.291015625, 82.0517578125, 84.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 5.0, 8.0, 8.0, 13.0, 15.0, 20.0, 11.0, 27.0, 28.0, 26.0, 39.0, 38.0, 43.0, 43.0, 48.0, 42.0, 45.0, 40.0, 51.0, 42.0, 44.0, 52.0, 42.0, 25.0, 36.0, 37.0, 24.0, 17.0, 24.0, 16.0, 20.0, 20.0, 9.0, 4.0, 6.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.40625, -46.970703125, -45.53515625, -44.099609375, -42.6640625, -41.228515625, -39.79296875, -38.357421875, -36.921875, -35.486328125, -34.05078125, -32.615234375, -31.1796875, -29.744140625, -28.30859375, -26.873046875, -25.4375, -24.001953125, -22.56640625, -21.130859375, -19.6953125, -18.259765625, -16.82421875, -15.388671875, -13.953125, -12.517578125, -11.08203125, -9.646484375, -8.2109375, -6.775390625, -5.33984375, -3.904296875, -2.46875, -1.033203125, 0.40234375, 1.837890625, 3.2734375, 4.708984375, 6.14453125, 7.580078125, 9.015625, 10.451171875, 11.88671875, 13.322265625, 14.7578125, 16.193359375, 17.62890625, 19.064453125, 20.5, 21.935546875, 23.37109375, 24.806640625, 26.2421875, 27.677734375, 29.11328125, 30.548828125, 31.984375, 33.419921875, 34.85546875, 36.291015625, 37.7265625, 39.162109375, 40.59765625, 42.033203125, 43.46875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 7.0, 29.0, 25.0, 36.0, 47.0, 59.0, 82.0, 96.0, 149.0, 241.0, 370.0, 542.0, 787.0, 1130.0, 1924.0, 2850.0, 4670.0, 7648.0, 13094.0, 23282.0, 43363.0, 88525.0, 204858.0, 335954.0, 161347.0, 72189.0, 36215.0, 19474.0, 11242.0, 6723.0, 4017.0, 2615.0, 1654.0, 1033.0, 727.0, 489.0, 344.0, 239.0, 146.0, 111.0, 73.0, 46.0, 29.0, 23.0, 17.0, 11.0, 5.0, 3.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-112.375, -108.7919921875, -105.208984375, -101.6259765625, -98.04296875, -94.4599609375, -90.876953125, -87.2939453125, -83.7109375, -80.1279296875, -76.544921875, -72.9619140625, -69.37890625, -65.7958984375, -62.212890625, -58.6298828125, -55.046875, -51.4638671875, -47.880859375, -44.2978515625, -40.71484375, -37.1318359375, -33.548828125, -29.9658203125, -26.3828125, -22.7998046875, -19.216796875, -15.6337890625, -12.05078125, -8.4677734375, -4.884765625, -1.3017578125, 2.28125, 5.8642578125, 9.447265625, 13.0302734375, 16.61328125, 20.1962890625, 23.779296875, 27.3623046875, 30.9453125, 34.5283203125, 38.111328125, 41.6943359375, 45.27734375, 48.8603515625, 52.443359375, 56.0263671875, 59.609375, 63.1923828125, 66.775390625, 70.3583984375, 73.94140625, 77.5244140625, 81.107421875, 84.6904296875, 88.2734375, 91.8564453125, 95.439453125, 99.0224609375, 102.60546875, 106.1884765625, 109.771484375, 113.3544921875, 116.9375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 4.0, 9.0, 13.0, 8.0, 12.0, 19.0, 18.0, 16.0, 24.0, 32.0, 26.0, 31.0, 34.0, 32.0, 41.0, 43.0, 61.0, 38.0, 41.0, 47.0, 46.0, 37.0, 37.0, 47.0, 28.0, 28.0, 22.0, 34.0, 28.0, 18.0, 19.0, 23.0, 15.0, 9.0, 12.0, 10.0, 8.0, 3.0, 4.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -30.186767578125, -29.13916015625, -28.091552734375, -27.0439453125, -25.996337890625, -24.94873046875, -23.901123046875, -22.853515625, -21.805908203125, -20.75830078125, -19.710693359375, -18.6630859375, -17.615478515625, -16.56787109375, -15.520263671875, -14.47265625, -13.425048828125, -12.37744140625, -11.329833984375, -10.2822265625, -9.234619140625, -8.18701171875, -7.139404296875, -6.091796875, -5.044189453125, -3.99658203125, -2.948974609375, -1.9013671875, -0.853759765625, 0.19384765625, 1.241455078125, 2.2890625, 3.336669921875, 4.38427734375, 5.431884765625, 6.4794921875, 7.527099609375, 8.57470703125, 9.622314453125, 10.669921875, 11.717529296875, 12.76513671875, 13.812744140625, 14.8603515625, 15.907958984375, 16.95556640625, 18.003173828125, 19.05078125, 20.098388671875, 21.14599609375, 22.193603515625, 23.2412109375, 24.288818359375, 25.33642578125, 26.384033203125, 27.431640625, 28.479248046875, 29.52685546875, 30.574462890625, 31.6220703125, 32.669677734375, 33.71728515625, 34.764892578125, 35.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 8.0, 18.0, 14.0, 20.0, 24.0, 38.0, 41.0, 60.0, 62.0, 81.0, 118.0, 143.0, 222.0, 304.0, 477.0, 764.0, 1324.0, 2672.0, 6039.0, 16609.0, 79438.0, 717217.0, 179517.0, 26755.0, 8286.0, 3492.0, 1826.0, 1043.0, 587.0, 399.0, 267.0, 177.0, 140.0, 83.0, 75.0, 57.0, 34.0, 27.0, 21.0, 16.0, 13.0, 5.0, 9.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.3125, -75.759765625, -73.20703125, -70.654296875, -68.1015625, -65.548828125, -62.99609375, -60.443359375, -57.890625, -55.337890625, -52.78515625, -50.232421875, -47.6796875, -45.126953125, -42.57421875, -40.021484375, -37.46875, -34.916015625, -32.36328125, -29.810546875, -27.2578125, -24.705078125, -22.15234375, -19.599609375, -17.046875, -14.494140625, -11.94140625, -9.388671875, -6.8359375, -4.283203125, -1.73046875, 0.822265625, 3.375, 5.927734375, 8.48046875, 11.033203125, 13.5859375, 16.138671875, 18.69140625, 21.244140625, 23.796875, 26.349609375, 28.90234375, 31.455078125, 34.0078125, 36.560546875, 39.11328125, 41.666015625, 44.21875, 46.771484375, 49.32421875, 51.876953125, 54.4296875, 56.982421875, 59.53515625, 62.087890625, 64.640625, 67.193359375, 69.74609375, 72.298828125, 74.8515625, 77.404296875, 79.95703125, 82.509765625, 85.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 8.0, 14.0, 20.0, 37.0, 92.0, 232.0, 316.0, 142.0, 63.0, 28.0, 9.0, 7.0, 10.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01021575927734375, -0.009941577911376953, -0.009667396545410156, -0.00939321517944336, -0.009119033813476562, -0.008844852447509766, -0.008570671081542969, -0.008296489715576172, -0.008022308349609375, -0.007748126983642578, -0.007473945617675781, -0.007199764251708984, -0.0069255828857421875, -0.006651401519775391, -0.006377220153808594, -0.006103038787841797, -0.005828857421875, -0.005554676055908203, -0.005280494689941406, -0.005006313323974609, -0.0047321319580078125, -0.004457950592041016, -0.004183769226074219, -0.003909587860107422, -0.003635406494140625, -0.003361225128173828, -0.0030870437622070312, -0.0028128623962402344, -0.0025386810302734375, -0.0022644996643066406, -0.0019903182983398438, -0.0017161369323730469, -0.00144195556640625, -0.0011677742004394531, -0.0008935928344726562, -0.0006194114685058594, -0.0003452301025390625, -7.104873657226562e-05, 0.00020313262939453125, 0.0004773139953613281, 0.000751495361328125, 0.0010256767272949219, 0.0012998580932617188, 0.0015740394592285156, 0.0018482208251953125, 0.0021224021911621094, 0.0023965835571289062, 0.002670764923095703, 0.0029449462890625, 0.003219127655029297, 0.0034933090209960938, 0.0037674903869628906, 0.0040416717529296875, 0.004315853118896484, 0.004590034484863281, 0.004864215850830078, 0.005138397216796875, 0.005412578582763672, 0.005686759948730469, 0.005960941314697266, 0.0062351226806640625, 0.006509304046630859, 0.006783485412597656, 0.007057666778564453, 0.00733184814453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 2.0, 7.0, 6.0, 8.0, 12.0, 17.0, 15.0, 23.0, 47.0, 50.0, 89.0, 107.0, 183.0, 270.0, 395.0, 632.0, 1040.0, 1712.0, 2920.0, 5096.0, 10367.0, 26470.0, 111332.0, 599301.0, 219077.0, 40359.0, 13771.0, 6276.0, 3486.0, 2012.0, 1241.0, 727.0, 454.0, 344.0, 253.0, 154.0, 102.0, 54.0, 47.0, 31.0, 21.0, 13.0, 15.0, 6.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-84.25, -81.95263671875, -79.6552734375, -77.35791015625, -75.060546875, -72.76318359375, -70.4658203125, -68.16845703125, -65.87109375, -63.57373046875, -61.2763671875, -58.97900390625, -56.681640625, -54.38427734375, -52.0869140625, -49.78955078125, -47.4921875, -45.19482421875, -42.8974609375, -40.60009765625, -38.302734375, -36.00537109375, -33.7080078125, -31.41064453125, -29.11328125, -26.81591796875, -24.5185546875, -22.22119140625, -19.923828125, -17.62646484375, -15.3291015625, -13.03173828125, -10.734375, -8.43701171875, -6.1396484375, -3.84228515625, -1.544921875, 0.75244140625, 3.0498046875, 5.34716796875, 7.64453125, 9.94189453125, 12.2392578125, 14.53662109375, 16.833984375, 19.13134765625, 21.4287109375, 23.72607421875, 26.0234375, 28.32080078125, 30.6181640625, 32.91552734375, 35.212890625, 37.51025390625, 39.8076171875, 42.10498046875, 44.40234375, 46.69970703125, 48.9970703125, 51.29443359375, 53.591796875, 55.88916015625, 58.1865234375, 60.48388671875, 62.78125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 11.0, 10.0, 11.0, 18.0, 29.0, 48.0, 76.0, 131.0, 151.0, 144.0, 101.0, 90.0, 43.0, 31.0, 22.0, 13.0, 6.0, 9.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.3778076171875, -12.794677734375, -12.2115478515625, -11.62841796875, -11.0452880859375, -10.462158203125, -9.8790283203125, -9.2958984375, -8.7127685546875, -8.129638671875, -7.5465087890625, -6.96337890625, -6.3802490234375, -5.797119140625, -5.2139892578125, -4.630859375, -4.0477294921875, -3.464599609375, -2.8814697265625, -2.29833984375, -1.7152099609375, -1.132080078125, -0.5489501953125, 0.0341796875, 0.6173095703125, 1.200439453125, 1.7835693359375, 2.36669921875, 2.9498291015625, 3.532958984375, 4.1160888671875, 4.69921875, 5.2823486328125, 5.865478515625, 6.4486083984375, 7.03173828125, 7.6148681640625, 8.197998046875, 8.7811279296875, 9.3642578125, 9.9473876953125, 10.530517578125, 11.1136474609375, 11.69677734375, 12.2799072265625, 12.863037109375, 13.4461669921875, 14.029296875, 14.6124267578125, 15.195556640625, 15.7786865234375, 16.36181640625, 16.9449462890625, 17.528076171875, 18.1112060546875, 18.6943359375, 19.2774658203125, 19.860595703125, 20.4437255859375, 21.02685546875, 21.6099853515625, 22.193115234375, 22.7762451171875, 23.359375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 8.0, 4.0, 8.0, 14.0, 15.0, 19.0, 33.0, 35.0, 46.0, 36.0, 48.0, 55.0, 61.0, 62.0, 59.0, 66.0, 53.0, 55.0, 45.0, 42.0, 28.0, 30.0, 32.0, 22.0, 21.0, 12.0, 16.0, 11.0, 10.0, 3.0, 5.0, 5.0, 3.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.002079010009766, -41.50918960571289, -40.016300201416016, -38.523406982421875, -37.030517578125, -35.537628173828125, -34.04473876953125, -32.551849365234375, -31.058958053588867, -29.566068649291992, -28.073177337646484, -26.58028793334961, -25.087398529052734, -23.594507217407227, -22.10161781311035, -20.608726501464844, -19.11583709716797, -17.622947692871094, -16.130056381225586, -14.637166976928711, -13.14427661895752, -11.651386260986328, -10.158496856689453, -8.665606498718262, -7.17271614074707, -5.679825782775879, -4.186935901641846, -2.6940460205078125, -1.201155662536621, 0.2917346954345703, 1.7846240997314453, 3.2775144577026367, 4.770404815673828, 6.2632951736450195, 7.756185054779053, 9.249074935913086, 10.741965293884277, 12.234855651855469, 13.727745056152344, 15.220635414123535, 16.713525772094727, 18.2064151763916, 19.69930648803711, 21.192195892333984, 22.68508529663086, 24.177976608276367, 25.670866012573242, 27.16375732421875, 28.656646728515625, 30.1495361328125, 31.642427444458008, 33.13531494140625, 34.62820816040039, 36.121097564697266, 37.61398696899414, 39.106876373291016, 40.599769592285156, 42.09265899658203, 43.585548400878906, 45.07843780517578, 46.57133102416992, 48.0642204284668, 49.55710983276367, 51.04999923706055, 52.54288864135742]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 4.0, 7.0, 10.0, 13.0, 17.0, 15.0, 14.0, 13.0, 25.0, 22.0, 30.0, 25.0, 43.0, 47.0, 50.0, 32.0, 30.0, 40.0, 38.0, 48.0, 57.0, 38.0, 40.0, 36.0, 35.0, 26.0, 27.0, 26.0, 28.0, 21.0, 17.0, 18.0, 20.0, 13.0, 13.0, 9.0, 8.0, 6.0, 7.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-44.74073791503906, -43.462337493896484, -42.18394088745117, -40.905540466308594, -39.627140045166016, -38.34873962402344, -37.070343017578125, -35.79194259643555, -34.51354217529297, -33.23514175415039, -31.956743240356445, -30.6783447265625, -29.399944305419922, -28.121545791625977, -26.84314727783203, -25.564746856689453, -24.28635025024414, -23.007951736450195, -21.729551315307617, -20.451152801513672, -19.172752380371094, -17.89435386657715, -16.615955352783203, -15.337555885314941, -14.05915641784668, -12.780756950378418, -11.502357482910156, -10.223958969116211, -8.94555950164795, -7.6671600341796875, -6.388761043548584, -5.1103620529174805, -3.8319664001464844, -2.5535671710968018, -1.2751679420471191, 0.0032312870025634766, 1.281630516052246, 2.560029983520508, 3.8384289741516113, 5.116827964782715, 6.395227432250977, 7.673626899719238, 8.9520263671875, 10.230424880981445, 11.508824348449707, 12.787223815917969, 14.065622329711914, 15.344021797180176, 16.622421264648438, 17.900819778442383, 19.17922019958496, 20.457618713378906, 21.736019134521484, 23.01441764831543, 24.292816162109375, 25.571216583251953, 26.8496150970459, 28.128013610839844, 29.406414031982422, 30.684812545776367, 31.963211059570312, 33.24161148071289, 34.52001190185547, 35.79840850830078, 37.07680892944336]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 13.0, 10.0, 16.0, 28.0, 43.0, 48.0, 67.0, 146.0, 216.0, 326.0, 473.0, 708.0, 1058.0, 1579.0, 2557.0, 3953.0, 6163.0, 9856.0, 15872.0, 25872.0, 41218.0, 66957.0, 108330.0, 166545.0, 198222.0, 148217.0, 95088.0, 58839.0, 35885.0, 22316.0, 13767.0, 8713.0, 5455.0, 3497.0, 2256.0, 1481.0, 999.0, 567.0, 398.0, 277.0, 159.0, 125.0, 78.0, 51.0, 35.0, 26.0, 23.0, 10.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-50.6875, -49.16796875, -47.6484375, -46.12890625, -44.609375, -43.08984375, -41.5703125, -40.05078125, -38.53125, -37.01171875, -35.4921875, -33.97265625, -32.453125, -30.93359375, -29.4140625, -27.89453125, -26.375, -24.85546875, -23.3359375, -21.81640625, -20.296875, -18.77734375, -17.2578125, -15.73828125, -14.21875, -12.69921875, -11.1796875, -9.66015625, -8.140625, -6.62109375, -5.1015625, -3.58203125, -2.0625, -0.54296875, 0.9765625, 2.49609375, 4.015625, 5.53515625, 7.0546875, 8.57421875, 10.09375, 11.61328125, 13.1328125, 14.65234375, 16.171875, 17.69140625, 19.2109375, 20.73046875, 22.25, 23.76953125, 25.2890625, 26.80859375, 28.328125, 29.84765625, 31.3671875, 32.88671875, 34.40625, 35.92578125, 37.4453125, 38.96484375, 40.484375, 42.00390625, 43.5234375, 45.04296875, 46.5625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 2.0, 6.0, 3.0, 6.0, 3.0, 4.0, 8.0, 11.0, 15.0, 17.0, 14.0, 17.0, 22.0, 22.0, 29.0, 30.0, 44.0, 50.0, 45.0, 32.0, 47.0, 35.0, 45.0, 39.0, 48.0, 40.0, 46.0, 43.0, 36.0, 27.0, 32.0, 29.0, 23.0, 26.0, 17.0, 17.0, 16.0, 10.0, 11.0, 7.0, 10.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-45.3125, -44.0087890625, -42.705078125, -41.4013671875, -40.09765625, -38.7939453125, -37.490234375, -36.1865234375, -34.8828125, -33.5791015625, -32.275390625, -30.9716796875, -29.66796875, -28.3642578125, -27.060546875, -25.7568359375, -24.453125, -23.1494140625, -21.845703125, -20.5419921875, -19.23828125, -17.9345703125, -16.630859375, -15.3271484375, -14.0234375, -12.7197265625, -11.416015625, -10.1123046875, -8.80859375, -7.5048828125, -6.201171875, -4.8974609375, -3.59375, -2.2900390625, -0.986328125, 0.3173828125, 1.62109375, 2.9248046875, 4.228515625, 5.5322265625, 6.8359375, 8.1396484375, 9.443359375, 10.7470703125, 12.05078125, 13.3544921875, 14.658203125, 15.9619140625, 17.265625, 18.5693359375, 19.873046875, 21.1767578125, 22.48046875, 23.7841796875, 25.087890625, 26.3916015625, 27.6953125, 28.9990234375, 30.302734375, 31.6064453125, 32.91015625, 34.2138671875, 35.517578125, 36.8212890625, 38.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 12.0, 15.0, 14.0, 19.0, 39.0, 52.0, 77.0, 128.0, 202.0, 278.0, 477.0, 827.0, 1381.0, 2356.0, 4108.0, 7529.0, 13944.0, 26707.0, 51895.0, 102817.0, 199559.0, 272697.0, 176477.0, 89715.0, 45059.0, 23886.0, 12478.0, 6841.0, 3775.0, 2056.0, 1217.0, 689.0, 421.0, 286.0, 170.0, 130.0, 66.0, 46.0, 35.0, 22.0, 17.0, 10.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.3125, -68.8017578125, -66.291015625, -63.7802734375, -61.26953125, -58.7587890625, -56.248046875, -53.7373046875, -51.2265625, -48.7158203125, -46.205078125, -43.6943359375, -41.18359375, -38.6728515625, -36.162109375, -33.6513671875, -31.140625, -28.6298828125, -26.119140625, -23.6083984375, -21.09765625, -18.5869140625, -16.076171875, -13.5654296875, -11.0546875, -8.5439453125, -6.033203125, -3.5224609375, -1.01171875, 1.4990234375, 4.009765625, 6.5205078125, 9.03125, 11.5419921875, 14.052734375, 16.5634765625, 19.07421875, 21.5849609375, 24.095703125, 26.6064453125, 29.1171875, 31.6279296875, 34.138671875, 36.6494140625, 39.16015625, 41.6708984375, 44.181640625, 46.6923828125, 49.203125, 51.7138671875, 54.224609375, 56.7353515625, 59.24609375, 61.7568359375, 64.267578125, 66.7783203125, 69.2890625, 71.7998046875, 74.310546875, 76.8212890625, 79.33203125, 81.8427734375, 84.353515625, 86.8642578125, 89.375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 14.0, 8.0, 13.0, 11.0, 20.0, 22.0, 32.0, 16.0, 32.0, 30.0, 29.0, 49.0, 37.0, 44.0, 28.0, 49.0, 34.0, 42.0, 49.0, 42.0, 45.0, 40.0, 30.0, 37.0, 29.0, 32.0, 28.0, 28.0, 17.0, 12.0, 17.0, 19.0, 9.0, 14.0, 9.0, 6.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.9375, -29.06884765625, -28.2001953125, -27.33154296875, -26.462890625, -25.59423828125, -24.7255859375, -23.85693359375, -22.98828125, -22.11962890625, -21.2509765625, -20.38232421875, -19.513671875, -18.64501953125, -17.7763671875, -16.90771484375, -16.0390625, -15.17041015625, -14.3017578125, -13.43310546875, -12.564453125, -11.69580078125, -10.8271484375, -9.95849609375, -9.08984375, -8.22119140625, -7.3525390625, -6.48388671875, -5.615234375, -4.74658203125, -3.8779296875, -3.00927734375, -2.140625, -1.27197265625, -0.4033203125, 0.46533203125, 1.333984375, 2.20263671875, 3.0712890625, 3.93994140625, 4.80859375, 5.67724609375, 6.5458984375, 7.41455078125, 8.283203125, 9.15185546875, 10.0205078125, 10.88916015625, 11.7578125, 12.62646484375, 13.4951171875, 14.36376953125, 15.232421875, 16.10107421875, 16.9697265625, 17.83837890625, 18.70703125, 19.57568359375, 20.4443359375, 21.31298828125, 22.181640625, 23.05029296875, 23.9189453125, 24.78759765625, 25.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 17.0, 23.0, 32.0, 34.0, 54.0, 90.0, 100.0, 143.0, 216.0, 354.0, 463.0, 743.0, 1142.0, 1844.0, 3024.0, 5075.0, 9225.0, 17601.0, 36579.0, 88436.0, 249293.0, 373052.0, 149232.0, 56263.0, 25236.0, 12728.0, 6892.0, 4029.0, 2300.0, 1462.0, 915.0, 591.0, 428.0, 277.0, 178.0, 130.0, 96.0, 85.0, 45.0, 32.0, 24.0, 15.0, 20.0, 10.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-33.21875, -32.18896484375, -31.1591796875, -30.12939453125, -29.099609375, -28.06982421875, -27.0400390625, -26.01025390625, -24.98046875, -23.95068359375, -22.9208984375, -21.89111328125, -20.861328125, -19.83154296875, -18.8017578125, -17.77197265625, -16.7421875, -15.71240234375, -14.6826171875, -13.65283203125, -12.623046875, -11.59326171875, -10.5634765625, -9.53369140625, -8.50390625, -7.47412109375, -6.4443359375, -5.41455078125, -4.384765625, -3.35498046875, -2.3251953125, -1.29541015625, -0.265625, 0.76416015625, 1.7939453125, 2.82373046875, 3.853515625, 4.88330078125, 5.9130859375, 6.94287109375, 7.97265625, 9.00244140625, 10.0322265625, 11.06201171875, 12.091796875, 13.12158203125, 14.1513671875, 15.18115234375, 16.2109375, 17.24072265625, 18.2705078125, 19.30029296875, 20.330078125, 21.35986328125, 22.3896484375, 23.41943359375, 24.44921875, 25.47900390625, 26.5087890625, 27.53857421875, 28.568359375, 29.59814453125, 30.6279296875, 31.65771484375, 32.6875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 1.0, 4.0, 5.0, 11.0, 8.0, 19.0, 19.0, 32.0, 54.0, 90.0, 155.0, 188.0, 154.0, 84.0, 68.0, 45.0, 20.0, 15.0, 16.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004175961017608643, -0.00402987003326416, -0.0038837790489196777, -0.0037376880645751953, -0.003591597080230713, -0.0034455060958862305, -0.003299415111541748, -0.0031533241271972656, -0.003007233142852783, -0.0028611421585083008, -0.0027150511741638184, -0.002568960189819336, -0.0024228692054748535, -0.002276778221130371, -0.0021306872367858887, -0.0019845962524414062, -0.0018385052680969238, -0.0016924142837524414, -0.001546323299407959, -0.0014002323150634766, -0.0012541413307189941, -0.0011080503463745117, -0.0009619593620300293, -0.0008158683776855469, -0.0006697773933410645, -0.000523686408996582, -0.0003775954246520996, -0.0002315044403076172, -8.541345596313477e-05, 6.0677528381347656e-05, 0.00020676851272583008, 0.0003528594970703125, 0.0004989504814147949, 0.0006450414657592773, 0.0007911324501037598, 0.0009372234344482422, 0.0010833144187927246, 0.001229405403137207, 0.0013754963874816895, 0.0015215873718261719, 0.0016676783561706543, 0.0018137693405151367, 0.001959860324859619, 0.0021059513092041016, 0.002252042293548584, 0.0023981332778930664, 0.002544224262237549, 0.0026903152465820312, 0.0028364062309265137, 0.002982497215270996, 0.0031285881996154785, 0.003274679183959961, 0.0034207701683044434, 0.0035668611526489258, 0.003712952136993408, 0.0038590431213378906, 0.004005134105682373, 0.0041512250900268555, 0.004297316074371338, 0.00444340705871582, 0.004589498043060303, 0.004735589027404785, 0.004881680011749268, 0.00502777099609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 3.0, 4.0, 8.0, 14.0, 11.0, 13.0, 26.0, 30.0, 63.0, 63.0, 114.0, 164.0, 252.0, 389.0, 645.0, 1053.0, 1819.0, 3290.0, 6125.0, 12201.0, 26035.0, 63161.0, 177763.0, 408843.0, 213376.0, 74138.0, 29930.0, 13580.0, 6827.0, 3600.0, 1919.0, 1156.0, 680.0, 445.0, 282.0, 156.0, 117.0, 70.0, 58.0, 41.0, 31.0, 18.0, 12.0, 10.0, 6.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-37.5, -36.38330078125, -35.2666015625, -34.14990234375, -33.033203125, -31.91650390625, -30.7998046875, -29.68310546875, -28.56640625, -27.44970703125, -26.3330078125, -25.21630859375, -24.099609375, -22.98291015625, -21.8662109375, -20.74951171875, -19.6328125, -18.51611328125, -17.3994140625, -16.28271484375, -15.166015625, -14.04931640625, -12.9326171875, -11.81591796875, -10.69921875, -9.58251953125, -8.4658203125, -7.34912109375, -6.232421875, -5.11572265625, -3.9990234375, -2.88232421875, -1.765625, -0.64892578125, 0.4677734375, 1.58447265625, 2.701171875, 3.81787109375, 4.9345703125, 6.05126953125, 7.16796875, 8.28466796875, 9.4013671875, 10.51806640625, 11.634765625, 12.75146484375, 13.8681640625, 14.98486328125, 16.1015625, 17.21826171875, 18.3349609375, 19.45166015625, 20.568359375, 21.68505859375, 22.8017578125, 23.91845703125, 25.03515625, 26.15185546875, 27.2685546875, 28.38525390625, 29.501953125, 30.61865234375, 31.7353515625, 32.85205078125, 33.96875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 10.0, 12.0, 12.0, 14.0, 24.0, 23.0, 26.0, 42.0, 29.0, 40.0, 65.0, 76.0, 63.0, 70.0, 70.0, 73.0, 68.0, 61.0, 41.0, 25.0, 33.0, 23.0, 18.0, 21.0, 11.0, 15.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8125, -7.55615234375, -7.2998046875, -7.04345703125, -6.787109375, -6.53076171875, -6.2744140625, -6.01806640625, -5.76171875, -5.50537109375, -5.2490234375, -4.99267578125, -4.736328125, -4.47998046875, -4.2236328125, -3.96728515625, -3.7109375, -3.45458984375, -3.1982421875, -2.94189453125, -2.685546875, -2.42919921875, -2.1728515625, -1.91650390625, -1.66015625, -1.40380859375, -1.1474609375, -0.89111328125, -0.634765625, -0.37841796875, -0.1220703125, 0.13427734375, 0.390625, 0.64697265625, 0.9033203125, 1.15966796875, 1.416015625, 1.67236328125, 1.9287109375, 2.18505859375, 2.44140625, 2.69775390625, 2.9541015625, 3.21044921875, 3.466796875, 3.72314453125, 3.9794921875, 4.23583984375, 4.4921875, 4.74853515625, 5.0048828125, 5.26123046875, 5.517578125, 5.77392578125, 6.0302734375, 6.28662109375, 6.54296875, 6.79931640625, 7.0556640625, 7.31201171875, 7.568359375, 7.82470703125, 8.0810546875, 8.33740234375, 8.59375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 10.0, 11.0, 13.0, 20.0, 20.0, 19.0, 26.0, 37.0, 43.0, 48.0, 42.0, 68.0, 51.0, 49.0, 59.0, 66.0, 58.0, 52.0, 40.0, 38.0, 25.0, 32.0, 23.0, 18.0, 17.0, 18.0, 21.0, 9.0, 9.0, 6.0, 6.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.66911697387695, -39.29092788696289, -37.912742614746094, -36.53455352783203, -35.15636444091797, -33.778175354003906, -32.399986267089844, -31.021800994873047, -29.643611907958984, -28.265422821044922, -26.887235641479492, -25.509048461914062, -24.130859375, -22.752670288085938, -21.374483108520508, -19.996295928955078, -18.618106842041016, -17.239917755126953, -15.861730575561523, -14.483542442321777, -13.105354309082031, -11.727166175842285, -10.348978042602539, -8.970789909362793, -7.592601776123047, -6.214413642883301, -4.836225509643555, -3.4580373764038086, -2.0798492431640625, -0.7016611099243164, 0.6765270233154297, 2.054715156555176, 3.4329071044921875, 4.811095237731934, 6.18928337097168, 7.567471504211426, 8.945659637451172, 10.323847770690918, 11.702035903930664, 13.08022403717041, 14.458412170410156, 15.836600303649902, 17.21478843688965, 18.592975616455078, 19.97116470336914, 21.349353790283203, 22.727540969848633, 24.105728149414062, 25.483917236328125, 26.862106323242188, 28.240293502807617, 29.618480682373047, 30.99666976928711, 32.37485885620117, 33.75304412841797, 35.13123321533203, 36.509422302246094, 37.887611389160156, 39.26580047607422, 40.643985748291016, 42.02217483520508, 43.40036392211914, 44.77854919433594, 46.15673828125, 47.53492736816406]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 10.0, 10.0, 8.0, 17.0, 16.0, 16.0, 29.0, 21.0, 24.0, 23.0, 35.0, 31.0, 40.0, 50.0, 51.0, 42.0, 45.0, 46.0, 54.0, 43.0, 46.0, 41.0, 34.0, 35.0, 40.0, 22.0, 25.0, 23.0, 18.0, 25.0, 16.0, 12.0, 10.0, 3.0, 11.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.09554672241211, -40.7083854675293, -39.321224212646484, -37.934059143066406, -36.546897888183594, -35.15973663330078, -33.77257537841797, -32.385414123535156, -30.998252868652344, -29.61109161376953, -28.223928451538086, -26.836767196655273, -25.44960594177246, -24.062442779541016, -22.675281524658203, -21.28812026977539, -19.900957107543945, -18.513795852661133, -17.126632690429688, -15.739471435546875, -14.352310180664062, -12.965147972106934, -11.577985763549805, -10.190824508666992, -8.803662300109863, -7.416500568389893, -6.029338836669922, -4.642176628112793, -3.2550148963928223, -1.8678531646728516, -0.48069095611572266, 0.9064702987670898, 2.2936325073242188, 3.6807942390441895, 5.06795597076416, 6.455118179321289, 7.84227991104126, 9.22944164276123, 10.61660385131836, 12.003765106201172, 13.3909273147583, 14.77808952331543, 16.165250778198242, 17.552413940429688, 18.9395751953125, 20.326736450195312, 21.713897705078125, 23.101058959960938, 24.488222122192383, 25.875383377075195, 27.26254653930664, 28.649707794189453, 30.036869049072266, 31.424030303955078, 32.811195373535156, 34.19835662841797, 35.58551788330078, 36.972679138183594, 38.359840393066406, 39.74700164794922, 41.1341667175293, 42.52132797241211, 43.90848922729492, 45.295650482177734, 46.68281173706055]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 3.0, 10.0, 13.0, 22.0, 23.0, 48.0, 59.0, 94.0, 135.0, 196.0, 314.0, 445.0, 676.0, 1100.0, 1742.0, 2935.0, 4821.0, 8480.0, 15336.0, 28358.0, 55106.0, 117470.0, 331195.0, 1103656.0, 1549676.0, 609556.0, 192868.0, 81404.0, 40173.0, 21282.0, 11449.0, 6509.0, 3605.0, 2121.0, 1273.0, 731.0, 509.0, 317.0, 216.0, 112.0, 90.0, 46.0, 44.0, 27.0, 12.0, 8.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.9375, -58.134765625, -56.33203125, -54.529296875, -52.7265625, -50.923828125, -49.12109375, -47.318359375, -45.515625, -43.712890625, -41.91015625, -40.107421875, -38.3046875, -36.501953125, -34.69921875, -32.896484375, -31.09375, -29.291015625, -27.48828125, -25.685546875, -23.8828125, -22.080078125, -20.27734375, -18.474609375, -16.671875, -14.869140625, -13.06640625, -11.263671875, -9.4609375, -7.658203125, -5.85546875, -4.052734375, -2.25, -0.447265625, 1.35546875, 3.158203125, 4.9609375, 6.763671875, 8.56640625, 10.369140625, 12.171875, 13.974609375, 15.77734375, 17.580078125, 19.3828125, 21.185546875, 22.98828125, 24.791015625, 26.59375, 28.396484375, 30.19921875, 32.001953125, 33.8046875, 35.607421875, 37.41015625, 39.212890625, 41.015625, 42.818359375, 44.62109375, 46.423828125, 48.2265625, 50.029296875, 51.83203125, 53.634765625, 55.4375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 6.0, 12.0, 12.0, 17.0, 15.0, 14.0, 26.0, 25.0, 25.0, 31.0, 29.0, 29.0, 39.0, 46.0, 41.0, 34.0, 35.0, 50.0, 27.0, 34.0, 39.0, 54.0, 43.0, 33.0, 31.0, 36.0, 24.0, 14.0, 28.0, 18.0, 11.0, 21.0, 12.0, 19.0, 6.0, 6.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-34.53125, -33.583251953125, -32.63525390625, -31.687255859375, -30.7392578125, -29.791259765625, -28.84326171875, -27.895263671875, -26.947265625, -25.999267578125, -25.05126953125, -24.103271484375, -23.1552734375, -22.207275390625, -21.25927734375, -20.311279296875, -19.36328125, -18.415283203125, -17.46728515625, -16.519287109375, -15.5712890625, -14.623291015625, -13.67529296875, -12.727294921875, -11.779296875, -10.831298828125, -9.88330078125, -8.935302734375, -7.9873046875, -7.039306640625, -6.09130859375, -5.143310546875, -4.1953125, -3.247314453125, -2.29931640625, -1.351318359375, -0.4033203125, 0.544677734375, 1.49267578125, 2.440673828125, 3.388671875, 4.336669921875, 5.28466796875, 6.232666015625, 7.1806640625, 8.128662109375, 9.07666015625, 10.024658203125, 10.97265625, 11.920654296875, 12.86865234375, 13.816650390625, 14.7646484375, 15.712646484375, 16.66064453125, 17.608642578125, 18.556640625, 19.504638671875, 20.45263671875, 21.400634765625, 22.3486328125, 23.296630859375, 24.24462890625, 25.192626953125, 26.140625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 16.0, 24.0, 39.0, 55.0, 68.0, 107.0, 175.0, 254.0, 410.0, 698.0, 1103.0, 1747.0, 2784.0, 4998.0, 8297.0, 15276.0, 28117.0, 53791.0, 110263.0, 241838.0, 597793.0, 1499201.0, 953570.0, 358724.0, 156486.0, 74229.0, 37562.0, 19931.0, 11108.0, 6221.0, 3613.0, 2092.0, 1350.0, 851.0, 535.0, 356.0, 184.0, 131.0, 82.0, 61.0, 47.0, 26.0, 22.0, 16.0, 5.0, 5.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.90625, -49.13427734375, -47.3623046875, -45.59033203125, -43.818359375, -42.04638671875, -40.2744140625, -38.50244140625, -36.73046875, -34.95849609375, -33.1865234375, -31.41455078125, -29.642578125, -27.87060546875, -26.0986328125, -24.32666015625, -22.5546875, -20.78271484375, -19.0107421875, -17.23876953125, -15.466796875, -13.69482421875, -11.9228515625, -10.15087890625, -8.37890625, -6.60693359375, -4.8349609375, -3.06298828125, -1.291015625, 0.48095703125, 2.2529296875, 4.02490234375, 5.796875, 7.56884765625, 9.3408203125, 11.11279296875, 12.884765625, 14.65673828125, 16.4287109375, 18.20068359375, 19.97265625, 21.74462890625, 23.5166015625, 25.28857421875, 27.060546875, 28.83251953125, 30.6044921875, 32.37646484375, 34.1484375, 35.92041015625, 37.6923828125, 39.46435546875, 41.236328125, 43.00830078125, 44.7802734375, 46.55224609375, 48.32421875, 50.09619140625, 51.8681640625, 53.64013671875, 55.412109375, 57.18408203125, 58.9560546875, 60.72802734375, 62.5]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 6.0, 4.0, 6.0, 7.0, 12.0, 18.0, 19.0, 23.0, 24.0, 36.0, 56.0, 59.0, 75.0, 78.0, 99.0, 121.0, 142.0, 207.0, 186.0, 251.0, 314.0, 347.0, 291.0, 305.0, 262.0, 210.0, 149.0, 143.0, 120.0, 89.0, 74.0, 60.0, 44.0, 42.0, 42.0, 25.0, 26.0, 28.0, 16.0, 12.0, 8.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-14.3671875, -13.8990478515625, -13.430908203125, -12.9627685546875, -12.49462890625, -12.0264892578125, -11.558349609375, -11.0902099609375, -10.6220703125, -10.1539306640625, -9.685791015625, -9.2176513671875, -8.74951171875, -8.2813720703125, -7.813232421875, -7.3450927734375, -6.876953125, -6.4088134765625, -5.940673828125, -5.4725341796875, -5.00439453125, -4.5362548828125, -4.068115234375, -3.5999755859375, -3.1318359375, -2.6636962890625, -2.195556640625, -1.7274169921875, -1.25927734375, -0.7911376953125, -0.322998046875, 0.1451416015625, 0.61328125, 1.0814208984375, 1.549560546875, 2.0177001953125, 2.48583984375, 2.9539794921875, 3.422119140625, 3.8902587890625, 4.3583984375, 4.8265380859375, 5.294677734375, 5.7628173828125, 6.23095703125, 6.6990966796875, 7.167236328125, 7.6353759765625, 8.103515625, 8.5716552734375, 9.039794921875, 9.5079345703125, 9.97607421875, 10.4442138671875, 10.912353515625, 11.3804931640625, 11.8486328125, 12.3167724609375, 12.784912109375, 13.2530517578125, 13.72119140625, 14.1893310546875, 14.657470703125, 15.1256103515625, 15.59375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 6.0, 5.0, 5.0, 11.0, 17.0, 19.0, 24.0, 26.0, 37.0, 43.0, 56.0, 51.0, 63.0, 54.0, 63.0, 59.0, 68.0, 68.0, 52.0, 56.0, 38.0, 33.0, 25.0, 28.0, 24.0, 17.0, 14.0, 5.0, 3.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03245544433594, -38.56648254394531, -37.10050964355469, -35.63453674316406, -34.16856384277344, -32.70259094238281, -31.236618041992188, -29.770645141601562, -28.304672241210938, -26.838699340820312, -25.372726440429688, -23.906753540039062, -22.440780639648438, -20.974807739257812, -19.508834838867188, -18.042861938476562, -16.576889038085938, -15.110916137695312, -13.644943237304688, -12.178970336914062, -10.712997436523438, -9.247024536132812, -7.7810516357421875, -6.3150787353515625, -4.8491058349609375, -3.3831329345703125, -1.9171600341796875, -0.4511871337890625, 1.0147857666015625, 2.4807586669921875, 3.9467315673828125, 5.4127044677734375, 6.878681182861328, 8.344654083251953, 9.810626983642578, 11.276599884033203, 12.742572784423828, 14.208545684814453, 15.674518585205078, 17.140491485595703, 18.606464385986328, 20.072437286376953, 21.538410186767578, 23.004383087158203, 24.470355987548828, 25.936328887939453, 27.402301788330078, 28.868274688720703, 30.334247589111328, 31.800220489501953, 33.26619338989258, 34.7321662902832, 36.19813919067383, 37.66411209106445, 39.13008499145508, 40.5960578918457, 42.06203079223633, 43.52800369262695, 44.99397659301758, 46.4599494934082, 47.92592239379883, 49.39189529418945, 50.85786819458008, 52.3238410949707, 53.78981399536133]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 14.0, 5.0, 8.0, 12.0, 20.0, 23.0, 22.0, 26.0, 28.0, 21.0, 47.0, 28.0, 37.0, 42.0, 41.0, 40.0, 36.0, 40.0, 34.0, 50.0, 44.0, 35.0, 40.0, 37.0, 39.0, 32.0, 24.0, 23.0, 26.0, 20.0, 14.0, 16.0, 10.0, 15.0, 9.0, 9.0, 4.0, 2.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.90105438232422, -34.77497482299805, -33.64889907836914, -32.52281951904297, -31.396739959716797, -30.270662307739258, -29.14458465576172, -28.018505096435547, -26.892427444458008, -25.76634979248047, -24.640270233154297, -23.514192581176758, -22.38811492919922, -21.262035369873047, -20.135957717895508, -19.00988006591797, -17.883800506591797, -16.757722854614258, -15.631643295288086, -14.505565643310547, -13.379487037658691, -12.253408432006836, -11.127330780029297, -10.001252174377441, -8.875173568725586, -7.7490949630737305, -6.623016834259033, -5.496938705444336, -4.3708600997924805, -3.244781494140625, -2.1187033653259277, -0.9926252365112305, 0.13345718383789062, 1.259535551071167, 2.3856139183044434, 3.5116922855377197, 4.637770652770996, 5.763849258422852, 6.889927387237549, 8.016005516052246, 9.142084121704102, 10.268162727355957, 11.394241333007812, 12.520318984985352, 13.646397590637207, 14.772476196289062, 15.898553848266602, 17.02463150024414, 18.150711059570312, 19.27678871154785, 20.402868270874023, 21.528945922851562, 22.655025482177734, 23.781103134155273, 24.907180786132812, 26.033260345458984, 27.159337997436523, 28.285415649414062, 29.411495208740234, 30.537572860717773, 31.663650512695312, 32.789730072021484, 33.915809631347656, 35.04188537597656, 36.167964935302734]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 18.0, 20.0, 24.0, 41.0, 65.0, 76.0, 135.0, 206.0, 346.0, 556.0, 969.0, 1730.0, 3159.0, 5925.0, 11661.0, 23425.0, 51624.0, 123203.0, 305118.0, 301255.0, 120544.0, 50393.0, 23352.0, 11430.0, 5922.0, 3120.0, 1717.0, 936.0, 594.0, 345.0, 190.0, 140.0, 95.0, 55.0, 41.0, 29.0, 30.0, 20.0, 8.0, 7.0, 7.0, 4.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-78.25, -75.55078125, -72.8515625, -70.15234375, -67.453125, -64.75390625, -62.0546875, -59.35546875, -56.65625, -53.95703125, -51.2578125, -48.55859375, -45.859375, -43.16015625, -40.4609375, -37.76171875, -35.0625, -32.36328125, -29.6640625, -26.96484375, -24.265625, -21.56640625, -18.8671875, -16.16796875, -13.46875, -10.76953125, -8.0703125, -5.37109375, -2.671875, 0.02734375, 2.7265625, 5.42578125, 8.125, 10.82421875, 13.5234375, 16.22265625, 18.921875, 21.62109375, 24.3203125, 27.01953125, 29.71875, 32.41796875, 35.1171875, 37.81640625, 40.515625, 43.21484375, 45.9140625, 48.61328125, 51.3125, 54.01171875, 56.7109375, 59.41015625, 62.109375, 64.80859375, 67.5078125, 70.20703125, 72.90625, 75.60546875, 78.3046875, 81.00390625, 83.703125, 86.40234375, 89.1015625, 91.80078125, 94.5]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 12.0, 9.0, 9.0, 4.0, 14.0, 19.0, 18.0, 22.0, 35.0, 28.0, 30.0, 38.0, 36.0, 40.0, 39.0, 44.0, 48.0, 36.0, 42.0, 38.0, 37.0, 50.0, 31.0, 38.0, 49.0, 40.0, 26.0, 23.0, 25.0, 21.0, 19.0, 25.0, 13.0, 9.0, 10.0, 6.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.21875, -35.0673828125, -33.916015625, -32.7646484375, -31.61328125, -30.4619140625, -29.310546875, -28.1591796875, -27.0078125, -25.8564453125, -24.705078125, -23.5537109375, -22.40234375, -21.2509765625, -20.099609375, -18.9482421875, -17.796875, -16.6455078125, -15.494140625, -14.3427734375, -13.19140625, -12.0400390625, -10.888671875, -9.7373046875, -8.5859375, -7.4345703125, -6.283203125, -5.1318359375, -3.98046875, -2.8291015625, -1.677734375, -0.5263671875, 0.625, 1.7763671875, 2.927734375, 4.0791015625, 5.23046875, 6.3818359375, 7.533203125, 8.6845703125, 9.8359375, 10.9873046875, 12.138671875, 13.2900390625, 14.44140625, 15.5927734375, 16.744140625, 17.8955078125, 19.046875, 20.1982421875, 21.349609375, 22.5009765625, 23.65234375, 24.8037109375, 25.955078125, 27.1064453125, 28.2578125, 29.4091796875, 30.560546875, 31.7119140625, 32.86328125, 34.0146484375, 35.166015625, 36.3173828125, 37.46875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 6.0, 4.0, 10.0, 18.0, 34.0, 45.0, 73.0, 81.0, 133.0, 193.0, 301.0, 470.0, 672.0, 1053.0, 1615.0, 2682.0, 4449.0, 7539.0, 13317.0, 24864.0, 49374.0, 112462.0, 291515.0, 305570.0, 120250.0, 52469.0, 25785.0, 13612.0, 7847.0, 4465.0, 2741.0, 1678.0, 1092.0, 672.0, 489.0, 301.0, 217.0, 149.0, 90.0, 62.0, 42.0, 32.0, 24.0, 17.0, 14.0, 10.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-77.0625, -74.5791015625, -72.095703125, -69.6123046875, -67.12890625, -64.6455078125, -62.162109375, -59.6787109375, -57.1953125, -54.7119140625, -52.228515625, -49.7451171875, -47.26171875, -44.7783203125, -42.294921875, -39.8115234375, -37.328125, -34.8447265625, -32.361328125, -29.8779296875, -27.39453125, -24.9111328125, -22.427734375, -19.9443359375, -17.4609375, -14.9775390625, -12.494140625, -10.0107421875, -7.52734375, -5.0439453125, -2.560546875, -0.0771484375, 2.40625, 4.8896484375, 7.373046875, 9.8564453125, 12.33984375, 14.8232421875, 17.306640625, 19.7900390625, 22.2734375, 24.7568359375, 27.240234375, 29.7236328125, 32.20703125, 34.6904296875, 37.173828125, 39.6572265625, 42.140625, 44.6240234375, 47.107421875, 49.5908203125, 52.07421875, 54.5576171875, 57.041015625, 59.5244140625, 62.0078125, 64.4912109375, 66.974609375, 69.4580078125, 71.94140625, 74.4248046875, 76.908203125, 79.3916015625, 81.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 10.0, 6.0, 5.0, 9.0, 11.0, 15.0, 11.0, 11.0, 13.0, 24.0, 30.0, 20.0, 36.0, 28.0, 34.0, 36.0, 49.0, 43.0, 30.0, 33.0, 54.0, 39.0, 44.0, 42.0, 36.0, 37.0, 39.0, 33.0, 31.0, 25.0, 29.0, 21.0, 23.0, 21.0, 14.0, 12.0, 7.0, 5.0, 5.0, 8.0, 3.0, 7.0, 3.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.109375, -22.376220703125, -21.64306640625, -20.909912109375, -20.1767578125, -19.443603515625, -18.71044921875, -17.977294921875, -17.244140625, -16.510986328125, -15.77783203125, -15.044677734375, -14.3115234375, -13.578369140625, -12.84521484375, -12.112060546875, -11.37890625, -10.645751953125, -9.91259765625, -9.179443359375, -8.4462890625, -7.713134765625, -6.97998046875, -6.246826171875, -5.513671875, -4.780517578125, -4.04736328125, -3.314208984375, -2.5810546875, -1.847900390625, -1.11474609375, -0.381591796875, 0.3515625, 1.084716796875, 1.81787109375, 2.551025390625, 3.2841796875, 4.017333984375, 4.75048828125, 5.483642578125, 6.216796875, 6.949951171875, 7.68310546875, 8.416259765625, 9.1494140625, 9.882568359375, 10.61572265625, 11.348876953125, 12.08203125, 12.815185546875, 13.54833984375, 14.281494140625, 15.0146484375, 15.747802734375, 16.48095703125, 17.214111328125, 17.947265625, 18.680419921875, 19.41357421875, 20.146728515625, 20.8798828125, 21.613037109375, 22.34619140625, 23.079345703125, 23.8125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 10.0, 8.0, 9.0, 14.0, 25.0, 33.0, 27.0, 76.0, 95.0, 135.0, 206.0, 300.0, 502.0, 885.0, 1489.0, 2845.0, 5399.0, 11367.0, 27477.0, 75206.0, 268835.0, 446563.0, 130843.0, 42612.0, 17100.0, 7639.0, 3816.0, 2067.0, 1094.0, 690.0, 412.0, 283.0, 163.0, 103.0, 72.0, 44.0, 40.0, 32.0, 14.0, 10.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-26.375, -25.530517578125, -24.68603515625, -23.841552734375, -22.9970703125, -22.152587890625, -21.30810546875, -20.463623046875, -19.619140625, -18.774658203125, -17.93017578125, -17.085693359375, -16.2412109375, -15.396728515625, -14.55224609375, -13.707763671875, -12.86328125, -12.018798828125, -11.17431640625, -10.329833984375, -9.4853515625, -8.640869140625, -7.79638671875, -6.951904296875, -6.107421875, -5.262939453125, -4.41845703125, -3.573974609375, -2.7294921875, -1.885009765625, -1.04052734375, -0.196044921875, 0.6484375, 1.492919921875, 2.33740234375, 3.181884765625, 4.0263671875, 4.870849609375, 5.71533203125, 6.559814453125, 7.404296875, 8.248779296875, 9.09326171875, 9.937744140625, 10.7822265625, 11.626708984375, 12.47119140625, 13.315673828125, 14.16015625, 15.004638671875, 15.84912109375, 16.693603515625, 17.5380859375, 18.382568359375, 19.22705078125, 20.071533203125, 20.916015625, 21.760498046875, 22.60498046875, 23.449462890625, 24.2939453125, 25.138427734375, 25.98291015625, 26.827392578125, 27.671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 5.0, 8.0, 11.0, 15.0, 22.0, 15.0, 46.0, 46.0, 57.0, 74.0, 90.0, 106.0, 110.0, 78.0, 76.0, 56.0, 46.0, 32.0, 21.0, 18.0, 9.0, 9.0, 9.0, 8.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002593994140625, -0.0025217533111572266, -0.002449512481689453, -0.0023772716522216797, -0.0023050308227539062, -0.002232789993286133, -0.0021605491638183594, -0.002088308334350586, -0.0020160675048828125, -0.001943826675415039, -0.0018715858459472656, -0.0017993450164794922, -0.0017271041870117188, -0.0016548633575439453, -0.0015826225280761719, -0.0015103816986083984, -0.001438140869140625, -0.0013659000396728516, -0.0012936592102050781, -0.0012214183807373047, -0.0011491775512695312, -0.0010769367218017578, -0.0010046958923339844, -0.0009324550628662109, -0.0008602142333984375, -0.0007879734039306641, -0.0007157325744628906, -0.0006434917449951172, -0.0005712509155273438, -0.0004990100860595703, -0.0004267692565917969, -0.00035452842712402344, -0.00028228759765625, -0.00021004676818847656, -0.00013780593872070312, -6.556510925292969e-05, 6.67572021484375e-06, 7.891654968261719e-05, 0.00015115737915039062, 0.00022339820861816406, 0.0002956390380859375, 0.00036787986755371094, 0.0004401206970214844, 0.0005123615264892578, 0.0005846023559570312, 0.0006568431854248047, 0.0007290840148925781, 0.0008013248443603516, 0.000873565673828125, 0.0009458065032958984, 0.0010180473327636719, 0.0010902881622314453, 0.0011625289916992188, 0.0012347698211669922, 0.0013070106506347656, 0.001379251480102539, 0.0014514923095703125, 0.001523733139038086, 0.0015959739685058594, 0.0016682147979736328, 0.0017404556274414062, 0.0018126964569091797, 0.0018849372863769531, 0.0019571781158447266, 0.0020294189453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 3.0, 10.0, 16.0, 15.0, 36.0, 44.0, 48.0, 94.0, 121.0, 209.0, 281.0, 469.0, 693.0, 1132.0, 1913.0, 3295.0, 6165.0, 12607.0, 26493.0, 62347.0, 157100.0, 336697.0, 254709.0, 103027.0, 42064.0, 18765.0, 8950.0, 4600.0, 2602.0, 1457.0, 867.0, 589.0, 334.0, 245.0, 189.0, 128.0, 65.0, 49.0, 35.0, 29.0, 15.0, 17.0, 12.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.15625, -25.358154296875, -24.56005859375, -23.761962890625, -22.9638671875, -22.165771484375, -21.36767578125, -20.569580078125, -19.771484375, -18.973388671875, -18.17529296875, -17.377197265625, -16.5791015625, -15.781005859375, -14.98291015625, -14.184814453125, -13.38671875, -12.588623046875, -11.79052734375, -10.992431640625, -10.1943359375, -9.396240234375, -8.59814453125, -7.800048828125, -7.001953125, -6.203857421875, -5.40576171875, -4.607666015625, -3.8095703125, -3.011474609375, -2.21337890625, -1.415283203125, -0.6171875, 0.180908203125, 0.97900390625, 1.777099609375, 2.5751953125, 3.373291015625, 4.17138671875, 4.969482421875, 5.767578125, 6.565673828125, 7.36376953125, 8.161865234375, 8.9599609375, 9.758056640625, 10.55615234375, 11.354248046875, 12.15234375, 12.950439453125, 13.74853515625, 14.546630859375, 15.3447265625, 16.142822265625, 16.94091796875, 17.739013671875, 18.537109375, 19.335205078125, 20.13330078125, 20.931396484375, 21.7294921875, 22.527587890625, 23.32568359375, 24.123779296875, 24.921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 13.0, 13.0, 18.0, 25.0, 25.0, 41.0, 46.0, 54.0, 80.0, 67.0, 74.0, 66.0, 85.0, 66.0, 58.0, 59.0, 46.0, 40.0, 26.0, 20.0, 16.0, 15.0, 11.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.0093994140625, -7.745361328125, -7.4813232421875, -7.21728515625, -6.9532470703125, -6.689208984375, -6.4251708984375, -6.1611328125, -5.8970947265625, -5.633056640625, -5.3690185546875, -5.10498046875, -4.8409423828125, -4.576904296875, -4.3128662109375, -4.048828125, -3.7847900390625, -3.520751953125, -3.2567138671875, -2.99267578125, -2.7286376953125, -2.464599609375, -2.2005615234375, -1.9365234375, -1.6724853515625, -1.408447265625, -1.1444091796875, -0.88037109375, -0.6163330078125, -0.352294921875, -0.0882568359375, 0.17578125, 0.4398193359375, 0.703857421875, 0.9678955078125, 1.23193359375, 1.4959716796875, 1.760009765625, 2.0240478515625, 2.2880859375, 2.5521240234375, 2.816162109375, 3.0802001953125, 3.34423828125, 3.6082763671875, 3.872314453125, 4.1363525390625, 4.400390625, 4.6644287109375, 4.928466796875, 5.1925048828125, 5.45654296875, 5.7205810546875, 5.984619140625, 6.2486572265625, 6.5126953125, 6.7767333984375, 7.040771484375, 7.3048095703125, 7.56884765625, 7.8328857421875, 8.096923828125, 8.3609619140625, 8.625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 6.0, 7.0, 9.0, 9.0, 14.0, 20.0, 10.0, 20.0, 30.0, 42.0, 38.0, 57.0, 48.0, 57.0, 51.0, 70.0, 56.0, 71.0, 58.0, 70.0, 41.0, 37.0, 40.0, 26.0, 27.0, 13.0, 19.0, 11.0, 6.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.675437927246094, -33.38908386230469, -32.102725982666016, -30.816370010375977, -29.530014038085938, -28.2436580657959, -26.95730209350586, -25.67094612121582, -24.38459014892578, -23.098234176635742, -21.811878204345703, -20.525522232055664, -19.239166259765625, -17.952810287475586, -16.666454315185547, -15.380098342895508, -14.093742370605469, -12.80738639831543, -11.52103042602539, -10.234674453735352, -8.948318481445312, -7.661962509155273, -6.375606536865234, -5.089250564575195, -3.8028945922851562, -2.516538619995117, -1.2301826477050781, 0.05617332458496094, 1.342529296875, 2.628885269165039, 3.915241241455078, 5.201597213745117, 6.487953186035156, 7.774309158325195, 9.060665130615234, 10.347021102905273, 11.633377075195312, 12.919733047485352, 14.20608901977539, 15.49244499206543, 16.77880096435547, 18.065156936645508, 19.351512908935547, 20.637868881225586, 21.924224853515625, 23.210580825805664, 24.496936798095703, 25.783292770385742, 27.06964874267578, 28.35600471496582, 29.64236068725586, 30.9287166595459, 32.21507263183594, 33.501426696777344, 34.787784576416016, 36.07414245605469, 37.360496520996094, 38.6468505859375, 39.93320846557617, 41.219566345214844, 42.50592041015625, 43.792274475097656, 45.07863235473633, 46.364990234375, 47.651344299316406]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 10.0, 9.0, 8.0, 14.0, 17.0, 23.0, 27.0, 20.0, 26.0, 34.0, 41.0, 42.0, 26.0, 35.0, 51.0, 40.0, 32.0, 38.0, 43.0, 55.0, 35.0, 44.0, 44.0, 40.0, 28.0, 25.0, 20.0, 25.0, 28.0, 21.0, 19.0, 13.0, 15.0, 7.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.04462432861328, -32.96225357055664, -31.8798828125, -30.797510147094727, -29.715139389038086, -28.632768630981445, -27.550395965576172, -26.46802520751953, -25.38565444946289, -24.30328369140625, -23.22091293334961, -22.138540267944336, -21.056169509887695, -19.973798751831055, -18.89142608642578, -17.80905532836914, -16.7266845703125, -15.64431381225586, -14.561942100524902, -13.479570388793945, -12.397199630737305, -11.314828872680664, -10.232457160949707, -9.15008544921875, -8.06771469116211, -6.9853434562683105, -5.902972221374512, -4.820600986480713, -3.738229751586914, -2.6558585166931152, -1.5734872817993164, -0.4911160469055176, 0.5912551879882812, 1.67362642288208, 2.755997657775879, 3.8383688926696777, 4.920740127563477, 6.003111362457275, 7.085482597351074, 8.167854309082031, 9.250225067138672, 10.332595825195312, 11.41496753692627, 12.497339248657227, 13.579710006713867, 14.662080764770508, 15.744452476501465, 16.826824188232422, 17.909194946289062, 18.991565704345703, 20.073936462402344, 21.156309127807617, 22.238679885864258, 23.3210506439209, 24.403423309326172, 25.485794067382812, 26.568164825439453, 27.650535583496094, 28.732906341552734, 29.815279006958008, 30.89764976501465, 31.98002052307129, 33.06239318847656, 34.1447639465332, 35.227134704589844]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 18.0, 16.0, 33.0, 47.0, 68.0, 103.0, 146.0, 218.0, 378.0, 606.0, 909.0, 1549.0, 2423.0, 4103.0, 6944.0, 12397.0, 21484.0, 37783.0, 67915.0, 119462.0, 188676.0, 213966.0, 155537.0, 92330.0, 52299.0, 29274.0, 16477.0, 9322.0, 5585.0, 3248.0, 1948.0, 1160.0, 741.0, 491.0, 323.0, 199.0, 119.0, 84.0, 54.0, 39.0, 18.0, 16.0, 17.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-53.96875, -52.4384765625, -50.908203125, -49.3779296875, -47.84765625, -46.3173828125, -44.787109375, -43.2568359375, -41.7265625, -40.1962890625, -38.666015625, -37.1357421875, -35.60546875, -34.0751953125, -32.544921875, -31.0146484375, -29.484375, -27.9541015625, -26.423828125, -24.8935546875, -23.36328125, -21.8330078125, -20.302734375, -18.7724609375, -17.2421875, -15.7119140625, -14.181640625, -12.6513671875, -11.12109375, -9.5908203125, -8.060546875, -6.5302734375, -5.0, -3.4697265625, -1.939453125, -0.4091796875, 1.12109375, 2.6513671875, 4.181640625, 5.7119140625, 7.2421875, 8.7724609375, 10.302734375, 11.8330078125, 13.36328125, 14.8935546875, 16.423828125, 17.9541015625, 19.484375, 21.0146484375, 22.544921875, 24.0751953125, 25.60546875, 27.1357421875, 28.666015625, 30.1962890625, 31.7265625, 33.2568359375, 34.787109375, 36.3173828125, 37.84765625, 39.3779296875, 40.908203125, 42.4384765625, 43.96875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 9.0, 9.0, 5.0, 10.0, 16.0, 19.0, 27.0, 28.0, 26.0, 26.0, 38.0, 47.0, 36.0, 43.0, 33.0, 41.0, 44.0, 33.0, 51.0, 51.0, 57.0, 40.0, 55.0, 43.0, 23.0, 27.0, 27.0, 22.0, 16.0, 24.0, 13.0, 12.0, 14.0, 6.0, 4.0, 4.0, 8.0, 1.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -34.04638671875, -32.9365234375, -31.82666015625, -30.716796875, -29.60693359375, -28.4970703125, -27.38720703125, -26.27734375, -25.16748046875, -24.0576171875, -22.94775390625, -21.837890625, -20.72802734375, -19.6181640625, -18.50830078125, -17.3984375, -16.28857421875, -15.1787109375, -14.06884765625, -12.958984375, -11.84912109375, -10.7392578125, -9.62939453125, -8.51953125, -7.40966796875, -6.2998046875, -5.18994140625, -4.080078125, -2.97021484375, -1.8603515625, -0.75048828125, 0.359375, 1.46923828125, 2.5791015625, 3.68896484375, 4.798828125, 5.90869140625, 7.0185546875, 8.12841796875, 9.23828125, 10.34814453125, 11.4580078125, 12.56787109375, 13.677734375, 14.78759765625, 15.8974609375, 17.00732421875, 18.1171875, 19.22705078125, 20.3369140625, 21.44677734375, 22.556640625, 23.66650390625, 24.7763671875, 25.88623046875, 26.99609375, 28.10595703125, 29.2158203125, 30.32568359375, 31.435546875, 32.54541015625, 33.6552734375, 34.76513671875, 35.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 9.0, 17.0, 17.0, 41.0, 58.0, 76.0, 134.0, 211.0, 285.0, 484.0, 700.0, 1100.0, 1754.0, 2741.0, 4315.0, 6872.0, 10901.0, 17583.0, 28749.0, 47217.0, 78003.0, 124260.0, 179172.0, 187472.0, 135345.0, 85541.0, 52170.0, 31567.0, 19417.0, 11903.0, 7394.0, 4760.0, 2883.0, 1908.0, 1218.0, 766.0, 537.0, 323.0, 230.0, 138.0, 91.0, 72.0, 38.0, 34.0, 23.0, 7.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.5, -48.00439453125, -46.5087890625, -45.01318359375, -43.517578125, -42.02197265625, -40.5263671875, -39.03076171875, -37.53515625, -36.03955078125, -34.5439453125, -33.04833984375, -31.552734375, -30.05712890625, -28.5615234375, -27.06591796875, -25.5703125, -24.07470703125, -22.5791015625, -21.08349609375, -19.587890625, -18.09228515625, -16.5966796875, -15.10107421875, -13.60546875, -12.10986328125, -10.6142578125, -9.11865234375, -7.623046875, -6.12744140625, -4.6318359375, -3.13623046875, -1.640625, -0.14501953125, 1.3505859375, 2.84619140625, 4.341796875, 5.83740234375, 7.3330078125, 8.82861328125, 10.32421875, 11.81982421875, 13.3154296875, 14.81103515625, 16.306640625, 17.80224609375, 19.2978515625, 20.79345703125, 22.2890625, 23.78466796875, 25.2802734375, 26.77587890625, 28.271484375, 29.76708984375, 31.2626953125, 32.75830078125, 34.25390625, 35.74951171875, 37.2451171875, 38.74072265625, 40.236328125, 41.73193359375, 43.2275390625, 44.72314453125, 46.21875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 4.0, 6.0, 14.0, 20.0, 14.0, 20.0, 16.0, 12.0, 17.0, 19.0, 27.0, 42.0, 39.0, 33.0, 45.0, 33.0, 39.0, 49.0, 49.0, 42.0, 40.0, 40.0, 31.0, 40.0, 34.0, 32.0, 34.0, 25.0, 28.0, 23.0, 22.0, 14.0, 13.0, 19.0, 10.0, 6.0, 5.0, 7.0, 4.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.671875, -19.99560546875, -19.3193359375, -18.64306640625, -17.966796875, -17.29052734375, -16.6142578125, -15.93798828125, -15.26171875, -14.58544921875, -13.9091796875, -13.23291015625, -12.556640625, -11.88037109375, -11.2041015625, -10.52783203125, -9.8515625, -9.17529296875, -8.4990234375, -7.82275390625, -7.146484375, -6.47021484375, -5.7939453125, -5.11767578125, -4.44140625, -3.76513671875, -3.0888671875, -2.41259765625, -1.736328125, -1.06005859375, -0.3837890625, 0.29248046875, 0.96875, 1.64501953125, 2.3212890625, 2.99755859375, 3.673828125, 4.35009765625, 5.0263671875, 5.70263671875, 6.37890625, 7.05517578125, 7.7314453125, 8.40771484375, 9.083984375, 9.76025390625, 10.4365234375, 11.11279296875, 11.7890625, 12.46533203125, 13.1416015625, 13.81787109375, 14.494140625, 15.17041015625, 15.8466796875, 16.52294921875, 17.19921875, 17.87548828125, 18.5517578125, 19.22802734375, 19.904296875, 20.58056640625, 21.2568359375, 21.93310546875, 22.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 9.0, 11.0, 16.0, 25.0, 46.0, 60.0, 79.0, 117.0, 177.0, 259.0, 384.0, 605.0, 897.0, 1549.0, 2340.0, 3885.0, 6554.0, 11388.0, 21592.0, 42626.0, 89888.0, 194805.0, 302208.0, 190256.0, 87595.0, 41638.0, 21436.0, 11470.0, 6386.0, 3869.0, 2300.0, 1395.0, 934.0, 590.0, 359.0, 262.0, 166.0, 108.0, 82.0, 48.0, 36.0, 21.0, 30.0, 12.0, 11.0, 3.0, 5.0, 5.0, 0.0, 4.0, 4.0, 0.0, 3.0], "bins": [-18.5, -17.947509765625, -17.39501953125, -16.842529296875, -16.2900390625, -15.737548828125, -15.18505859375, -14.632568359375, -14.080078125, -13.527587890625, -12.97509765625, -12.422607421875, -11.8701171875, -11.317626953125, -10.76513671875, -10.212646484375, -9.66015625, -9.107666015625, -8.55517578125, -8.002685546875, -7.4501953125, -6.897705078125, -6.34521484375, -5.792724609375, -5.240234375, -4.687744140625, -4.13525390625, -3.582763671875, -3.0302734375, -2.477783203125, -1.92529296875, -1.372802734375, -0.8203125, -0.267822265625, 0.28466796875, 0.837158203125, 1.3896484375, 1.942138671875, 2.49462890625, 3.047119140625, 3.599609375, 4.152099609375, 4.70458984375, 5.257080078125, 5.8095703125, 6.362060546875, 6.91455078125, 7.467041015625, 8.01953125, 8.572021484375, 9.12451171875, 9.677001953125, 10.2294921875, 10.781982421875, 11.33447265625, 11.886962890625, 12.439453125, 12.991943359375, 13.54443359375, 14.096923828125, 14.6494140625, 15.201904296875, 15.75439453125, 16.306884765625, 16.859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 8.0, 9.0, 15.0, 17.0, 23.0, 47.0, 56.0, 77.0, 99.0, 146.0, 132.0, 97.0, 68.0, 45.0, 29.0, 32.0, 25.0, 14.0, 12.0, 10.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020694732666015625, -0.00199282169342041, -0.0019161701202392578, -0.0018395185470581055, -0.0017628669738769531, -0.0016862154006958008, -0.0016095638275146484, -0.001532912254333496, -0.0014562606811523438, -0.0013796091079711914, -0.001302957534790039, -0.0012263059616088867, -0.0011496543884277344, -0.001073002815246582, -0.0009963512420654297, -0.0009196996688842773, -0.000843048095703125, -0.0007663965225219727, -0.0006897449493408203, -0.000613093376159668, -0.0005364418029785156, -0.0004597902297973633, -0.00038313865661621094, -0.0003064870834350586, -0.00022983551025390625, -0.0001531839370727539, -7.653236389160156e-05, 1.1920928955078125e-07, 7.677078247070312e-05, 0.00015342235565185547, 0.0002300739288330078, 0.00030672550201416016, 0.0003833770751953125, 0.00046002864837646484, 0.0005366802215576172, 0.0006133317947387695, 0.0006899833679199219, 0.0007666349411010742, 0.0008432865142822266, 0.0009199380874633789, 0.0009965896606445312, 0.0010732412338256836, 0.001149892807006836, 0.0012265443801879883, 0.0013031959533691406, 0.001379847526550293, 0.0014564990997314453, 0.0015331506729125977, 0.00160980224609375, 0.0016864538192749023, 0.0017631053924560547, 0.001839756965637207, 0.0019164085388183594, 0.0019930601119995117, 0.002069711685180664, 0.0021463632583618164, 0.0022230148315429688, 0.002299666404724121, 0.0023763179779052734, 0.0024529695510864258, 0.002529621124267578, 0.0026062726974487305, 0.002682924270629883, 0.002759575843811035, 0.0028362274169921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 7.0, 15.0, 23.0, 31.0, 42.0, 57.0, 88.0, 153.0, 199.0, 312.0, 559.0, 869.0, 1626.0, 2810.0, 5282.0, 9870.0, 20253.0, 43133.0, 96989.0, 217999.0, 318493.0, 179618.0, 79028.0, 35383.0, 16846.0, 8518.0, 4454.0, 2445.0, 1321.0, 796.0, 490.0, 283.0, 174.0, 119.0, 82.0, 51.0, 24.0, 29.0, 23.0, 14.0, 11.0, 12.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.834716796875, -17.24755859375, -16.660400390625, -16.0732421875, -15.486083984375, -14.89892578125, -14.311767578125, -13.724609375, -13.137451171875, -12.55029296875, -11.963134765625, -11.3759765625, -10.788818359375, -10.20166015625, -9.614501953125, -9.02734375, -8.440185546875, -7.85302734375, -7.265869140625, -6.6787109375, -6.091552734375, -5.50439453125, -4.917236328125, -4.330078125, -3.742919921875, -3.15576171875, -2.568603515625, -1.9814453125, -1.394287109375, -0.80712890625, -0.219970703125, 0.3671875, 0.954345703125, 1.54150390625, 2.128662109375, 2.7158203125, 3.302978515625, 3.89013671875, 4.477294921875, 5.064453125, 5.651611328125, 6.23876953125, 6.825927734375, 7.4130859375, 8.000244140625, 8.58740234375, 9.174560546875, 9.76171875, 10.348876953125, 10.93603515625, 11.523193359375, 12.1103515625, 12.697509765625, 13.28466796875, 13.871826171875, 14.458984375, 15.046142578125, 15.63330078125, 16.220458984375, 16.8076171875, 17.394775390625, 17.98193359375, 18.569091796875, 19.15625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 6.0, 4.0, 8.0, 10.0, 9.0, 21.0, 18.0, 27.0, 22.0, 48.0, 32.0, 36.0, 33.0, 43.0, 56.0, 66.0, 66.0, 76.0, 72.0, 43.0, 50.0, 35.0, 31.0, 29.0, 23.0, 23.0, 15.0, 17.0, 11.0, 16.0, 12.0, 4.0, 5.0, 5.0, 2.0, 0.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.6851806640625, -4.550048828125, -4.4149169921875, -4.27978515625, -4.1446533203125, -4.009521484375, -3.8743896484375, -3.7392578125, -3.6041259765625, -3.468994140625, -3.3338623046875, -3.19873046875, -3.0635986328125, -2.928466796875, -2.7933349609375, -2.658203125, -2.5230712890625, -2.387939453125, -2.2528076171875, -2.11767578125, -1.9825439453125, -1.847412109375, -1.7122802734375, -1.5771484375, -1.4420166015625, -1.306884765625, -1.1717529296875, -1.03662109375, -0.9014892578125, -0.766357421875, -0.6312255859375, -0.49609375, -0.3609619140625, -0.225830078125, -0.0906982421875, 0.04443359375, 0.1795654296875, 0.314697265625, 0.4498291015625, 0.5849609375, 0.7200927734375, 0.855224609375, 0.9903564453125, 1.12548828125, 1.2606201171875, 1.395751953125, 1.5308837890625, 1.666015625, 1.8011474609375, 1.936279296875, 2.0714111328125, 2.20654296875, 2.3416748046875, 2.476806640625, 2.6119384765625, 2.7470703125, 2.8822021484375, 3.017333984375, 3.1524658203125, 3.28759765625, 3.4227294921875, 3.557861328125, 3.6929931640625, 3.828125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 7.0, 15.0, 17.0, 21.0, 18.0, 25.0, 22.0, 46.0, 51.0, 50.0, 70.0, 55.0, 73.0, 67.0, 78.0, 55.0, 55.0, 45.0, 41.0, 35.0, 27.0, 29.0, 24.0, 10.0, 16.0, 10.0, 7.0, 6.0, 5.0, 0.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.27734375, -35.90780258178711, -34.53826141357422, -33.16872024536133, -31.799179077148438, -30.429637908935547, -29.060096740722656, -27.690555572509766, -26.321014404296875, -24.951473236083984, -23.581932067871094, -22.212390899658203, -20.842849731445312, -19.473308563232422, -18.10376739501953, -16.73422622680664, -15.36468505859375, -13.99514389038086, -12.625602722167969, -11.256061553955078, -9.886520385742188, -8.516979217529297, -7.147438049316406, -5.777896881103516, -4.408355712890625, -3.0388145446777344, -1.6692733764648438, -0.2997322082519531, 1.0698089599609375, 2.439350128173828, 3.8088912963867188, 5.178432464599609, 6.547977447509766, 7.917518615722656, 9.287059783935547, 10.656600952148438, 12.026142120361328, 13.395683288574219, 14.76522445678711, 16.134765625, 17.50430679321289, 18.87384796142578, 20.243389129638672, 21.612930297851562, 22.982471466064453, 24.352012634277344, 25.721553802490234, 27.091094970703125, 28.460636138916016, 29.830177307128906, 31.199718475341797, 32.56925964355469, 33.93880081176758, 35.30834197998047, 36.67788314819336, 38.04742431640625, 39.41696548461914, 40.78650665283203, 42.15604782104492, 43.52558898925781, 44.8951301574707, 46.264671325683594, 47.634212493896484, 49.003753662109375, 50.373294830322266]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 2.0, 4.0, 6.0, 10.0, 12.0, 10.0, 9.0, 18.0, 19.0, 27.0, 33.0, 23.0, 26.0, 27.0, 34.0, 36.0, 32.0, 46.0, 47.0, 40.0, 29.0, 44.0, 40.0, 43.0, 45.0, 28.0, 32.0, 41.0, 38.0, 25.0, 27.0, 24.0, 13.0, 26.0, 18.0, 12.0, 9.0, 6.0, 7.0, 8.0, 5.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-37.34229278564453, -36.2725944519043, -35.20289611816406, -34.13319778442383, -33.063499450683594, -31.993799209594727, -30.924100875854492, -29.854402542114258, -28.78470230102539, -27.715003967285156, -26.645305633544922, -25.575607299804688, -24.50590705871582, -23.436208724975586, -22.36651039123535, -21.296812057495117, -20.227113723754883, -19.15741539001465, -18.087717056274414, -17.018016815185547, -15.948318481445312, -14.878620147705078, -13.808921813964844, -12.73922348022461, -11.669524192810059, -10.599825859069824, -9.530126571655273, -8.460428237915039, -7.3907294273376465, -6.321030616760254, -5.2513322830200195, -4.181633472442627, -3.1119327545166016, -2.042233943939209, -0.9725353717803955, 0.09716320037841797, 1.1668620109558105, 2.236560821533203, 3.3062591552734375, 4.37595796585083, 5.445656776428223, 6.515355587005615, 7.585054397583008, 8.654752731323242, 9.724451065063477, 10.794150352478027, 11.863848686218262, 12.933547973632812, 14.003246307373047, 15.072944641113281, 16.142642974853516, 17.21234130859375, 18.282041549682617, 19.35173988342285, 20.421438217163086, 21.49113655090332, 22.560836791992188, 23.630535125732422, 24.700233459472656, 25.76993179321289, 26.839632034301758, 27.909330368041992, 28.979028701782227, 30.04872703552246, 31.118425369262695]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 11.0, 15.0, 25.0, 30.0, 40.0, 73.0, 131.0, 176.0, 270.0, 404.0, 613.0, 960.0, 1434.0, 2209.0, 3379.0, 5078.0, 7926.0, 12431.0, 20153.0, 33511.0, 59514.0, 119271.0, 311421.0, 838834.0, 1337144.0, 858503.0, 316341.0, 119757.0, 58782.0, 32842.0, 19275.0, 11914.0, 7573.0, 4867.0, 3185.0, 2064.0, 1387.0, 890.0, 565.0, 411.0, 273.0, 200.0, 143.0, 70.0, 57.0, 44.0, 20.0, 19.0, 10.0, 14.0, 11.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-37.8125, -36.57275390625, -35.3330078125, -34.09326171875, -32.853515625, -31.61376953125, -30.3740234375, -29.13427734375, -27.89453125, -26.65478515625, -25.4150390625, -24.17529296875, -22.935546875, -21.69580078125, -20.4560546875, -19.21630859375, -17.9765625, -16.73681640625, -15.4970703125, -14.25732421875, -13.017578125, -11.77783203125, -10.5380859375, -9.29833984375, -8.05859375, -6.81884765625, -5.5791015625, -4.33935546875, -3.099609375, -1.85986328125, -0.6201171875, 0.61962890625, 1.859375, 3.09912109375, 4.3388671875, 5.57861328125, 6.818359375, 8.05810546875, 9.2978515625, 10.53759765625, 11.77734375, 13.01708984375, 14.2568359375, 15.49658203125, 16.736328125, 17.97607421875, 19.2158203125, 20.45556640625, 21.6953125, 22.93505859375, 24.1748046875, 25.41455078125, 26.654296875, 27.89404296875, 29.1337890625, 30.37353515625, 31.61328125, 32.85302734375, 34.0927734375, 35.33251953125, 36.572265625, 37.81201171875, 39.0517578125, 40.29150390625, 41.53125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 11.0, 18.0, 15.0, 18.0, 11.0, 24.0, 24.0, 27.0, 33.0, 31.0, 41.0, 33.0, 31.0, 51.0, 41.0, 39.0, 38.0, 40.0, 50.0, 37.0, 33.0, 30.0, 41.0, 31.0, 38.0, 30.0, 29.0, 18.0, 18.0, 17.0, 15.0, 14.0, 12.0, 10.0, 8.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.359375, -27.47021484375, -26.5810546875, -25.69189453125, -24.802734375, -23.91357421875, -23.0244140625, -22.13525390625, -21.24609375, -20.35693359375, -19.4677734375, -18.57861328125, -17.689453125, -16.80029296875, -15.9111328125, -15.02197265625, -14.1328125, -13.24365234375, -12.3544921875, -11.46533203125, -10.576171875, -9.68701171875, -8.7978515625, -7.90869140625, -7.01953125, -6.13037109375, -5.2412109375, -4.35205078125, -3.462890625, -2.57373046875, -1.6845703125, -0.79541015625, 0.09375, 0.98291015625, 1.8720703125, 2.76123046875, 3.650390625, 4.53955078125, 5.4287109375, 6.31787109375, 7.20703125, 8.09619140625, 8.9853515625, 9.87451171875, 10.763671875, 11.65283203125, 12.5419921875, 13.43115234375, 14.3203125, 15.20947265625, 16.0986328125, 16.98779296875, 17.876953125, 18.76611328125, 19.6552734375, 20.54443359375, 21.43359375, 22.32275390625, 23.2119140625, 24.10107421875, 24.990234375, 25.87939453125, 26.7685546875, 27.65771484375, 28.546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 30.0, 29.0, 43.0, 65.0, 84.0, 174.0, 242.0, 407.0, 668.0, 1123.0, 1861.0, 3152.0, 5618.0, 9926.0, 17822.0, 33271.0, 65933.0, 138641.0, 323027.0, 909416.0, 1632692.0, 601930.0, 232897.0, 104413.0, 50886.0, 26461.0, 14313.0, 7961.0, 4514.0, 2674.0, 1498.0, 940.0, 571.0, 333.0, 238.0, 142.0, 87.0, 55.0, 32.0, 24.0, 20.0, 8.0, 11.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-53.8125, -52.197265625, -50.58203125, -48.966796875, -47.3515625, -45.736328125, -44.12109375, -42.505859375, -40.890625, -39.275390625, -37.66015625, -36.044921875, -34.4296875, -32.814453125, -31.19921875, -29.583984375, -27.96875, -26.353515625, -24.73828125, -23.123046875, -21.5078125, -19.892578125, -18.27734375, -16.662109375, -15.046875, -13.431640625, -11.81640625, -10.201171875, -8.5859375, -6.970703125, -5.35546875, -3.740234375, -2.125, -0.509765625, 1.10546875, 2.720703125, 4.3359375, 5.951171875, 7.56640625, 9.181640625, 10.796875, 12.412109375, 14.02734375, 15.642578125, 17.2578125, 18.873046875, 20.48828125, 22.103515625, 23.71875, 25.333984375, 26.94921875, 28.564453125, 30.1796875, 31.794921875, 33.41015625, 35.025390625, 36.640625, 38.255859375, 39.87109375, 41.486328125, 43.1015625, 44.716796875, 46.33203125, 47.947265625, 49.5625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 8.0, 12.0, 20.0, 30.0, 26.0, 39.0, 52.0, 78.0, 87.0, 139.0, 186.0, 265.0, 282.0, 361.0, 485.0, 442.0, 386.0, 290.0, 208.0, 168.0, 105.0, 93.0, 82.0, 40.0, 36.0, 33.0, 34.0, 23.0, 17.0, 8.0, 8.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.171875, -19.59375, -19.015625, -18.4375, -17.859375, -17.28125, -16.703125, -16.125, -15.546875, -14.96875, -14.390625, -13.8125, -13.234375, -12.65625, -12.078125, -11.5, -10.921875, -10.34375, -9.765625, -9.1875, -8.609375, -8.03125, -7.453125, -6.875, -6.296875, -5.71875, -5.140625, -4.5625, -3.984375, -3.40625, -2.828125, -2.25, -1.671875, -1.09375, -0.515625, 0.0625, 0.640625, 1.21875, 1.796875, 2.375, 2.953125, 3.53125, 4.109375, 4.6875, 5.265625, 5.84375, 6.421875, 7.0, 7.578125, 8.15625, 8.734375, 9.3125, 9.890625, 10.46875, 11.046875, 11.625, 12.203125, 12.78125, 13.359375, 13.9375, 14.515625, 15.09375, 15.671875, 16.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 11.0, 7.0, 15.0, 22.0, 13.0, 22.0, 19.0, 33.0, 44.0, 56.0, 49.0, 54.0, 68.0, 65.0, 66.0, 77.0, 54.0, 48.0, 45.0, 45.0, 32.0, 37.0, 19.0, 20.0, 13.0, 7.0, 14.0, 5.0, 8.0, 3.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.2828483581543, -34.0324592590332, -32.78207015991211, -31.53168296813965, -30.281293869018555, -29.03090476989746, -27.780517578125, -26.530128479003906, -25.279739379882812, -24.02935028076172, -22.778961181640625, -21.528573989868164, -20.27818489074707, -19.027795791625977, -17.777408599853516, -16.527019500732422, -15.276630401611328, -14.026241302490234, -12.775853157043457, -11.52546501159668, -10.275075912475586, -9.024686813354492, -7.774298667907715, -6.5239105224609375, -5.273521423339844, -4.023132801055908, -2.7727441787719727, -1.522355556488037, -0.27196693420410156, 0.978421688079834, 2.2288103103637695, 3.479198455810547, 4.729587554931641, 5.979976177215576, 7.230364799499512, 8.480752944946289, 9.731142044067383, 10.981531143188477, 12.231919288635254, 13.482307434082031, 14.732696533203125, 15.983085632324219, 17.233474731445312, 18.483861923217773, 19.734251022338867, 20.98464012145996, 22.235027313232422, 23.485416412353516, 24.73580551147461, 25.986194610595703, 27.236583709716797, 28.486970901489258, 29.73736000061035, 30.987749099731445, 32.238136291503906, 33.488525390625, 34.738914489746094, 35.98930358886719, 37.23969268798828, 38.490081787109375, 39.74047088623047, 40.9908561706543, 42.24124526977539, 43.491634368896484, 44.74202346801758]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 4.0, 4.0, 9.0, 11.0, 18.0, 15.0, 21.0, 21.0, 16.0, 26.0, 22.0, 25.0, 27.0, 29.0, 33.0, 32.0, 35.0, 37.0, 36.0, 43.0, 41.0, 42.0, 27.0, 32.0, 39.0, 48.0, 28.0, 24.0, 42.0, 31.0, 19.0, 17.0, 24.0, 19.0, 15.0, 19.0, 10.0, 10.0, 3.0, 9.0, 10.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.321773529052734, -30.385770797729492, -29.44976806640625, -28.513765335083008, -27.577762603759766, -26.641759872436523, -25.70575714111328, -24.76975440979004, -23.833751678466797, -22.897748947143555, -21.961746215820312, -21.02574348449707, -20.089740753173828, -19.153738021850586, -18.217735290527344, -17.2817325592041, -16.34572982788086, -15.409727096557617, -14.473724365234375, -13.537721633911133, -12.60171890258789, -11.665716171264648, -10.729713439941406, -9.793710708618164, -8.857709884643555, -7.9217071533203125, -6.98570442199707, -6.049701690673828, -5.113698959350586, -4.177696704864502, -3.2416939735412598, -2.3056912422180176, -1.3696880340576172, -0.4336853623390198, 0.5023173093795776, 1.4383199214935303, 2.3743226528167725, 3.3103251457214355, 4.246327877044678, 5.18233060836792, 6.118333339691162, 7.054336071014404, 7.9903388023376465, 8.92634105682373, 9.862343788146973, 10.798346519470215, 11.734349250793457, 12.6703519821167, 13.606354713439941, 14.542357444763184, 15.478360176086426, 16.41436195373535, 17.350364685058594, 18.286367416381836, 19.222370147705078, 20.15837287902832, 21.094375610351562, 22.030378341674805, 22.966381072998047, 23.90238380432129, 24.83838653564453, 25.774389266967773, 26.710391998291016, 27.646394729614258, 28.5823974609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 9.0, 10.0, 18.0, 18.0, 23.0, 59.0, 69.0, 131.0, 246.0, 431.0, 773.0, 1331.0, 2332.0, 4549.0, 8796.0, 18500.0, 43790.0, 125115.0, 399205.0, 291256.0, 88913.0, 33156.0, 14435.0, 7031.0, 3709.0, 2040.0, 1072.0, 673.0, 362.0, 191.0, 117.0, 63.0, 42.0, 28.0, 16.0, 13.0, 9.0, 6.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.625, -80.25390625, -77.8828125, -75.51171875, -73.140625, -70.76953125, -68.3984375, -66.02734375, -63.65625, -61.28515625, -58.9140625, -56.54296875, -54.171875, -51.80078125, -49.4296875, -47.05859375, -44.6875, -42.31640625, -39.9453125, -37.57421875, -35.203125, -32.83203125, -30.4609375, -28.08984375, -25.71875, -23.34765625, -20.9765625, -18.60546875, -16.234375, -13.86328125, -11.4921875, -9.12109375, -6.75, -4.37890625, -2.0078125, 0.36328125, 2.734375, 5.10546875, 7.4765625, 9.84765625, 12.21875, 14.58984375, 16.9609375, 19.33203125, 21.703125, 24.07421875, 26.4453125, 28.81640625, 31.1875, 33.55859375, 35.9296875, 38.30078125, 40.671875, 43.04296875, 45.4140625, 47.78515625, 50.15625, 52.52734375, 54.8984375, 57.26953125, 59.640625, 62.01171875, 64.3828125, 66.75390625, 69.125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 21.0, 12.0, 17.0, 22.0, 14.0, 16.0, 20.0, 20.0, 28.0, 31.0, 39.0, 29.0, 43.0, 41.0, 41.0, 35.0, 37.0, 41.0, 49.0, 30.0, 25.0, 46.0, 36.0, 31.0, 39.0, 34.0, 23.0, 18.0, 12.0, 18.0, 25.0, 11.0, 13.0, 11.0, 11.0, 2.0, 8.0, 12.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-31.828125, -30.891845703125, -29.95556640625, -29.019287109375, -28.0830078125, -27.146728515625, -26.21044921875, -25.274169921875, -24.337890625, -23.401611328125, -22.46533203125, -21.529052734375, -20.5927734375, -19.656494140625, -18.72021484375, -17.783935546875, -16.84765625, -15.911376953125, -14.97509765625, -14.038818359375, -13.1025390625, -12.166259765625, -11.22998046875, -10.293701171875, -9.357421875, -8.421142578125, -7.48486328125, -6.548583984375, -5.6123046875, -4.676025390625, -3.73974609375, -2.803466796875, -1.8671875, -0.930908203125, 0.00537109375, 0.941650390625, 1.8779296875, 2.814208984375, 3.75048828125, 4.686767578125, 5.623046875, 6.559326171875, 7.49560546875, 8.431884765625, 9.3681640625, 10.304443359375, 11.24072265625, 12.177001953125, 13.11328125, 14.049560546875, 14.98583984375, 15.922119140625, 16.8583984375, 17.794677734375, 18.73095703125, 19.667236328125, 20.603515625, 21.539794921875, 22.47607421875, 23.412353515625, 24.3486328125, 25.284912109375, 26.22119140625, 27.157470703125, 28.09375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 7.0, 18.0, 25.0, 33.0, 66.0, 93.0, 105.0, 153.0, 232.0, 335.0, 444.0, 695.0, 963.0, 1489.0, 2329.0, 3883.0, 6533.0, 11740.0, 21125.0, 42824.0, 94243.0, 252209.0, 353056.0, 134892.0, 57377.0, 27909.0, 14417.0, 8135.0, 4753.0, 2976.0, 1858.0, 1141.0, 770.0, 495.0, 367.0, 271.0, 165.0, 107.0, 93.0, 51.0, 45.0, 28.0, 24.0, 25.0, 9.0, 9.0, 6.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-57.90625, -56.0498046875, -54.193359375, -52.3369140625, -50.48046875, -48.6240234375, -46.767578125, -44.9111328125, -43.0546875, -41.1982421875, -39.341796875, -37.4853515625, -35.62890625, -33.7724609375, -31.916015625, -30.0595703125, -28.203125, -26.3466796875, -24.490234375, -22.6337890625, -20.77734375, -18.9208984375, -17.064453125, -15.2080078125, -13.3515625, -11.4951171875, -9.638671875, -7.7822265625, -5.92578125, -4.0693359375, -2.212890625, -0.3564453125, 1.5, 3.3564453125, 5.212890625, 7.0693359375, 8.92578125, 10.7822265625, 12.638671875, 14.4951171875, 16.3515625, 18.2080078125, 20.064453125, 21.9208984375, 23.77734375, 25.6337890625, 27.490234375, 29.3466796875, 31.203125, 33.0595703125, 34.916015625, 36.7724609375, 38.62890625, 40.4853515625, 42.341796875, 44.1982421875, 46.0546875, 47.9111328125, 49.767578125, 51.6240234375, 53.48046875, 55.3369140625, 57.193359375, 59.0498046875, 60.90625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 4.0, 12.0, 10.0, 12.0, 10.0, 14.0, 14.0, 27.0, 35.0, 27.0, 27.0, 25.0, 33.0, 34.0, 36.0, 35.0, 39.0, 45.0, 46.0, 43.0, 39.0, 39.0, 42.0, 38.0, 39.0, 35.0, 27.0, 29.0, 20.0, 36.0, 22.0, 20.0, 15.0, 11.0, 10.0, 10.0, 6.0, 7.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.5, -19.8662109375, -19.232421875, -18.5986328125, -17.96484375, -17.3310546875, -16.697265625, -16.0634765625, -15.4296875, -14.7958984375, -14.162109375, -13.5283203125, -12.89453125, -12.2607421875, -11.626953125, -10.9931640625, -10.359375, -9.7255859375, -9.091796875, -8.4580078125, -7.82421875, -7.1904296875, -6.556640625, -5.9228515625, -5.2890625, -4.6552734375, -4.021484375, -3.3876953125, -2.75390625, -2.1201171875, -1.486328125, -0.8525390625, -0.21875, 0.4150390625, 1.048828125, 1.6826171875, 2.31640625, 2.9501953125, 3.583984375, 4.2177734375, 4.8515625, 5.4853515625, 6.119140625, 6.7529296875, 7.38671875, 8.0205078125, 8.654296875, 9.2880859375, 9.921875, 10.5556640625, 11.189453125, 11.8232421875, 12.45703125, 13.0908203125, 13.724609375, 14.3583984375, 14.9921875, 15.6259765625, 16.259765625, 16.8935546875, 17.52734375, 18.1611328125, 18.794921875, 19.4287109375, 20.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 13.0, 11.0, 21.0, 16.0, 30.0, 40.0, 68.0, 56.0, 100.0, 138.0, 202.0, 278.0, 390.0, 620.0, 882.0, 1305.0, 2034.0, 3204.0, 5279.0, 9869.0, 21683.0, 67695.0, 369025.0, 437182.0, 78303.0, 24045.0, 10669.0, 5643.0, 3262.0, 2040.0, 1345.0, 913.0, 611.0, 424.0, 308.0, 233.0, 182.0, 131.0, 82.0, 74.0, 42.0, 27.0, 20.0, 13.0, 14.0, 12.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.8125, -25.948974609375, -25.08544921875, -24.221923828125, -23.3583984375, -22.494873046875, -21.63134765625, -20.767822265625, -19.904296875, -19.040771484375, -18.17724609375, -17.313720703125, -16.4501953125, -15.586669921875, -14.72314453125, -13.859619140625, -12.99609375, -12.132568359375, -11.26904296875, -10.405517578125, -9.5419921875, -8.678466796875, -7.81494140625, -6.951416015625, -6.087890625, -5.224365234375, -4.36083984375, -3.497314453125, -2.6337890625, -1.770263671875, -0.90673828125, -0.043212890625, 0.8203125, 1.683837890625, 2.54736328125, 3.410888671875, 4.2744140625, 5.137939453125, 6.00146484375, 6.864990234375, 7.728515625, 8.592041015625, 9.45556640625, 10.319091796875, 11.1826171875, 12.046142578125, 12.90966796875, 13.773193359375, 14.63671875, 15.500244140625, 16.36376953125, 17.227294921875, 18.0908203125, 18.954345703125, 19.81787109375, 20.681396484375, 21.544921875, 22.408447265625, 23.27197265625, 24.135498046875, 24.9990234375, 25.862548828125, 26.72607421875, 27.589599609375, 28.453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 10.0, 4.0, 8.0, 9.0, 22.0, 45.0, 80.0, 138.0, 200.0, 193.0, 116.0, 68.0, 43.0, 28.0, 11.0, 5.0, 9.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003154754638671875, -0.0030614733695983887, -0.0029681921005249023, -0.002874910831451416, -0.0027816295623779297, -0.0026883482933044434, -0.002595067024230957, -0.0025017857551574707, -0.0024085044860839844, -0.002315223217010498, -0.0022219419479370117, -0.0021286606788635254, -0.002035379409790039, -0.0019420981407165527, -0.0018488168716430664, -0.00175553560256958, -0.0016622543334960938, -0.0015689730644226074, -0.001475691795349121, -0.0013824105262756348, -0.0012891292572021484, -0.0011958479881286621, -0.0011025667190551758, -0.0010092854499816895, -0.0009160041809082031, -0.0008227229118347168, -0.0007294416427612305, -0.0006361603736877441, -0.0005428791046142578, -0.0004495978355407715, -0.00035631656646728516, -0.00026303529739379883, -0.0001697540283203125, -7.647275924682617e-05, 1.6808509826660156e-05, 0.00011008977890014648, 0.0002033710479736328, 0.00029665231704711914, 0.00038993358612060547, 0.0004832148551940918, 0.0005764961242675781, 0.0006697773933410645, 0.0007630586624145508, 0.0008563399314880371, 0.0009496212005615234, 0.0010429024696350098, 0.001136183738708496, 0.0012294650077819824, 0.0013227462768554688, 0.001416027545928955, 0.0015093088150024414, 0.0016025900840759277, 0.001695871353149414, 0.0017891526222229004, 0.0018824338912963867, 0.001975715160369873, 0.0020689964294433594, 0.0021622776985168457, 0.002255558967590332, 0.0023488402366638184, 0.0024421215057373047, 0.002535402774810791, 0.0026286840438842773, 0.0027219653129577637, 0.00281524658203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 14.0, 11.0, 25.0, 34.0, 37.0, 61.0, 115.0, 145.0, 222.0, 362.0, 554.0, 903.0, 1332.0, 2044.0, 3206.0, 5177.0, 8702.0, 17189.0, 41884.0, 147818.0, 495454.0, 219652.0, 56002.0, 21168.0, 10435.0, 5876.0, 3680.0, 2288.0, 1525.0, 924.0, 600.0, 401.0, 242.0, 191.0, 110.0, 49.0, 46.0, 25.0, 27.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-32.90625, -31.9560546875, -31.005859375, -30.0556640625, -29.10546875, -28.1552734375, -27.205078125, -26.2548828125, -25.3046875, -24.3544921875, -23.404296875, -22.4541015625, -21.50390625, -20.5537109375, -19.603515625, -18.6533203125, -17.703125, -16.7529296875, -15.802734375, -14.8525390625, -13.90234375, -12.9521484375, -12.001953125, -11.0517578125, -10.1015625, -9.1513671875, -8.201171875, -7.2509765625, -6.30078125, -5.3505859375, -4.400390625, -3.4501953125, -2.5, -1.5498046875, -0.599609375, 0.3505859375, 1.30078125, 2.2509765625, 3.201171875, 4.1513671875, 5.1015625, 6.0517578125, 7.001953125, 7.9521484375, 8.90234375, 9.8525390625, 10.802734375, 11.7529296875, 12.703125, 13.6533203125, 14.603515625, 15.5537109375, 16.50390625, 17.4541015625, 18.404296875, 19.3544921875, 20.3046875, 21.2548828125, 22.205078125, 23.1552734375, 24.10546875, 25.0556640625, 26.005859375, 26.9560546875, 27.90625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 7.0, 10.0, 13.0, 23.0, 30.0, 41.0, 55.0, 89.0, 108.0, 109.0, 96.0, 91.0, 67.0, 57.0, 38.0, 26.0, 17.0, 17.0, 8.0, 11.0, 11.0, 3.0, 8.0, 3.0, 6.0, 4.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-8.8984375, -8.649658203125, -8.40087890625, -8.152099609375, -7.9033203125, -7.654541015625, -7.40576171875, -7.156982421875, -6.908203125, -6.659423828125, -6.41064453125, -6.161865234375, -5.9130859375, -5.664306640625, -5.41552734375, -5.166748046875, -4.91796875, -4.669189453125, -4.42041015625, -4.171630859375, -3.9228515625, -3.674072265625, -3.42529296875, -3.176513671875, -2.927734375, -2.678955078125, -2.43017578125, -2.181396484375, -1.9326171875, -1.683837890625, -1.43505859375, -1.186279296875, -0.9375, -0.688720703125, -0.43994140625, -0.191162109375, 0.0576171875, 0.306396484375, 0.55517578125, 0.803955078125, 1.052734375, 1.301513671875, 1.55029296875, 1.799072265625, 2.0478515625, 2.296630859375, 2.54541015625, 2.794189453125, 3.04296875, 3.291748046875, 3.54052734375, 3.789306640625, 4.0380859375, 4.286865234375, 4.53564453125, 4.784423828125, 5.033203125, 5.281982421875, 5.53076171875, 5.779541015625, 6.0283203125, 6.277099609375, 6.52587890625, 6.774658203125, 7.0234375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 10.0, 15.0, 11.0, 10.0, 20.0, 19.0, 24.0, 34.0, 38.0, 44.0, 58.0, 62.0, 66.0, 58.0, 65.0, 64.0, 58.0, 57.0, 53.0, 39.0, 35.0, 26.0, 25.0, 17.0, 9.0, 14.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.382720947265625, -27.211339950561523, -26.03995704650879, -24.868576049804688, -23.697195053100586, -22.525814056396484, -21.35443115234375, -20.18305015563965, -19.011669158935547, -17.840288162231445, -16.66890525817871, -15.49752426147461, -14.326143264770508, -13.15476131439209, -11.983379364013672, -10.81199836730957, -9.640615463256836, -8.469233512878418, -7.297852516174316, -6.126470565795898, -4.955089092254639, -3.783707618713379, -2.612325668334961, -1.4409446716308594, -0.2695627212524414, 0.9018188714981079, 2.0732004642486572, 3.244582176208496, 4.415963649749756, 5.587345123291016, 6.758727073669434, 7.930108070373535, 9.101490020751953, 10.272871971130371, 11.444252967834473, 12.61563491821289, 13.787015914916992, 14.95839786529541, 16.129779815673828, 17.30116081237793, 18.47254180908203, 19.643922805786133, 20.815305709838867, 21.98668670654297, 23.15806770324707, 24.329448699951172, 25.500831604003906, 26.672212600708008, 27.843595504760742, 29.014976501464844, 30.186359405517578, 31.35774040222168, 32.52912139892578, 33.700504302978516, 34.87188720703125, 36.04326629638672, 37.21464920043945, 38.38603210449219, 39.557411193847656, 40.72879409790039, 41.900177001953125, 43.071556091308594, 44.24293899536133, 45.41432189941406, 46.58570098876953]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 3.0, 8.0, 8.0, 11.0, 12.0, 16.0, 17.0, 13.0, 21.0, 13.0, 31.0, 23.0, 34.0, 36.0, 17.0, 39.0, 30.0, 36.0, 36.0, 42.0, 35.0, 31.0, 45.0, 34.0, 25.0, 27.0, 37.0, 42.0, 33.0, 29.0, 22.0, 21.0, 22.0, 21.0, 22.0, 15.0, 14.0, 13.0, 11.0, 6.0, 12.0, 8.0, 4.0, 7.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-28.52808380126953, -27.666709899902344, -26.80533790588379, -25.9439640045166, -25.082592010498047, -24.22121810913086, -23.359844207763672, -22.498472213745117, -21.63709831237793, -20.775724411010742, -19.914352416992188, -19.052978515625, -18.191606521606445, -17.330232620239258, -16.468860626220703, -15.607486724853516, -14.746113777160645, -13.884740829467773, -13.023367881774902, -12.161994934082031, -11.300621032714844, -10.439248085021973, -9.577875137329102, -8.716501235961914, -7.855128765106201, -6.99375581741333, -6.132382392883301, -5.27100944519043, -4.409636497497559, -3.5482630729675293, -2.686890125274658, -1.825516700744629, -0.9641437530517578, -0.10277062654495239, 0.758602499961853, 1.6199755668640137, 2.481348752975464, 3.342721939086914, 4.204094886779785, 5.0654683113098145, 5.9268412590026855, 6.788214206695557, 7.649587631225586, 8.510960578918457, 9.372333526611328, 10.233707427978516, 11.09507942199707, 11.956453323364258, 12.817826271057129, 13.67919921875, 14.540572166442871, 15.401945114135742, 16.26331901550293, 17.124691009521484, 17.986064910888672, 18.84743881225586, 19.708810806274414, 20.5701847076416, 21.431556701660156, 22.292930603027344, 23.1543025970459, 24.015676498413086, 24.87704849243164, 25.738422393798828, 26.599796295166016]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 9.0, 7.0, 11.0, 16.0, 13.0, 35.0, 46.0, 55.0, 85.0, 152.0, 186.0, 289.0, 373.0, 546.0, 788.0, 1116.0, 1635.0, 2256.0, 3115.0, 4468.0, 6286.0, 9171.0, 13442.0, 19462.0, 28856.0, 43676.0, 64935.0, 98087.0, 139287.0, 164778.0, 141518.0, 99244.0, 66553.0, 44216.0, 29190.0, 19888.0, 13351.0, 9428.0, 6588.0, 4575.0, 3161.0, 2293.0, 1555.0, 1148.0, 852.0, 533.0, 388.0, 281.0, 191.0, 128.0, 103.0, 63.0, 45.0, 36.0, 17.0, 9.0, 14.0, 5.0, 3.0, 4.0, 4.0, 3.0], "bins": [-29.28125, -28.352294921875, -27.42333984375, -26.494384765625, -25.5654296875, -24.636474609375, -23.70751953125, -22.778564453125, -21.849609375, -20.920654296875, -19.99169921875, -19.062744140625, -18.1337890625, -17.204833984375, -16.27587890625, -15.346923828125, -14.41796875, -13.489013671875, -12.56005859375, -11.631103515625, -10.7021484375, -9.773193359375, -8.84423828125, -7.915283203125, -6.986328125, -6.057373046875, -5.12841796875, -4.199462890625, -3.2705078125, -2.341552734375, -1.41259765625, -0.483642578125, 0.4453125, 1.374267578125, 2.30322265625, 3.232177734375, 4.1611328125, 5.090087890625, 6.01904296875, 6.947998046875, 7.876953125, 8.805908203125, 9.73486328125, 10.663818359375, 11.5927734375, 12.521728515625, 13.45068359375, 14.379638671875, 15.30859375, 16.237548828125, 17.16650390625, 18.095458984375, 19.0244140625, 19.953369140625, 20.88232421875, 21.811279296875, 22.740234375, 23.669189453125, 24.59814453125, 25.527099609375, 26.4560546875, 27.385009765625, 28.31396484375, 29.242919921875, 30.171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 4.0, 4.0, 4.0, 4.0, 4.0, 15.0, 12.0, 16.0, 17.0, 11.0, 13.0, 27.0, 19.0, 28.0, 34.0, 36.0, 27.0, 29.0, 43.0, 36.0, 34.0, 32.0, 39.0, 30.0, 44.0, 31.0, 33.0, 29.0, 32.0, 36.0, 39.0, 37.0, 25.0, 26.0, 19.0, 14.0, 21.0, 14.0, 17.0, 11.0, 11.0, 5.0, 9.0, 12.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-27.1875, -26.344970703125, -25.50244140625, -24.659912109375, -23.8173828125, -22.974853515625, -22.13232421875, -21.289794921875, -20.447265625, -19.604736328125, -18.76220703125, -17.919677734375, -17.0771484375, -16.234619140625, -15.39208984375, -14.549560546875, -13.70703125, -12.864501953125, -12.02197265625, -11.179443359375, -10.3369140625, -9.494384765625, -8.65185546875, -7.809326171875, -6.966796875, -6.124267578125, -5.28173828125, -4.439208984375, -3.5966796875, -2.754150390625, -1.91162109375, -1.069091796875, -0.2265625, 0.615966796875, 1.45849609375, 2.301025390625, 3.1435546875, 3.986083984375, 4.82861328125, 5.671142578125, 6.513671875, 7.356201171875, 8.19873046875, 9.041259765625, 9.8837890625, 10.726318359375, 11.56884765625, 12.411376953125, 13.25390625, 14.096435546875, 14.93896484375, 15.781494140625, 16.6240234375, 17.466552734375, 18.30908203125, 19.151611328125, 19.994140625, 20.836669921875, 21.67919921875, 22.521728515625, 23.3642578125, 24.206787109375, 25.04931640625, 25.891845703125, 26.734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 14.0, 10.0, 21.0, 26.0, 50.0, 72.0, 102.0, 174.0, 274.0, 400.0, 641.0, 995.0, 1611.0, 2712.0, 4543.0, 7240.0, 12187.0, 21308.0, 37633.0, 69287.0, 128201.0, 216967.0, 228647.0, 140303.0, 76502.0, 41357.0, 23334.0, 13451.0, 8081.0, 4698.0, 2903.0, 1823.0, 1102.0, 721.0, 402.0, 262.0, 171.0, 103.0, 73.0, 46.0, 35.0, 28.0, 18.0, 13.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.53125, -43.05078125, -41.5703125, -40.08984375, -38.609375, -37.12890625, -35.6484375, -34.16796875, -32.6875, -31.20703125, -29.7265625, -28.24609375, -26.765625, -25.28515625, -23.8046875, -22.32421875, -20.84375, -19.36328125, -17.8828125, -16.40234375, -14.921875, -13.44140625, -11.9609375, -10.48046875, -9.0, -7.51953125, -6.0390625, -4.55859375, -3.078125, -1.59765625, -0.1171875, 1.36328125, 2.84375, 4.32421875, 5.8046875, 7.28515625, 8.765625, 10.24609375, 11.7265625, 13.20703125, 14.6875, 16.16796875, 17.6484375, 19.12890625, 20.609375, 22.08984375, 23.5703125, 25.05078125, 26.53125, 28.01171875, 29.4921875, 30.97265625, 32.453125, 33.93359375, 35.4140625, 36.89453125, 38.375, 39.85546875, 41.3359375, 42.81640625, 44.296875, 45.77734375, 47.2578125, 48.73828125, 50.21875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 9.0, 12.0, 10.0, 17.0, 21.0, 19.0, 22.0, 27.0, 36.0, 26.0, 39.0, 48.0, 39.0, 51.0, 42.0, 45.0, 48.0, 36.0, 49.0, 40.0, 51.0, 33.0, 34.0, 38.0, 22.0, 29.0, 18.0, 21.0, 19.0, 14.0, 8.0, 10.0, 11.0, 5.0, 4.0, 9.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.3125, -18.662353515625, -18.01220703125, -17.362060546875, -16.7119140625, -16.061767578125, -15.41162109375, -14.761474609375, -14.111328125, -13.461181640625, -12.81103515625, -12.160888671875, -11.5107421875, -10.860595703125, -10.21044921875, -9.560302734375, -8.91015625, -8.260009765625, -7.60986328125, -6.959716796875, -6.3095703125, -5.659423828125, -5.00927734375, -4.359130859375, -3.708984375, -3.058837890625, -2.40869140625, -1.758544921875, -1.1083984375, -0.458251953125, 0.19189453125, 0.842041015625, 1.4921875, 2.142333984375, 2.79248046875, 3.442626953125, 4.0927734375, 4.742919921875, 5.39306640625, 6.043212890625, 6.693359375, 7.343505859375, 7.99365234375, 8.643798828125, 9.2939453125, 9.944091796875, 10.59423828125, 11.244384765625, 11.89453125, 12.544677734375, 13.19482421875, 13.844970703125, 14.4951171875, 15.145263671875, 15.79541015625, 16.445556640625, 17.095703125, 17.745849609375, 18.39599609375, 19.046142578125, 19.6962890625, 20.346435546875, 20.99658203125, 21.646728515625, 22.296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 8.0, 10.0, 27.0, 42.0, 48.0, 88.0, 115.0, 188.0, 281.0, 481.0, 731.0, 1090.0, 1844.0, 3102.0, 5097.0, 9015.0, 15700.0, 28433.0, 52139.0, 98316.0, 183573.0, 255465.0, 179427.0, 96880.0, 51284.0, 28008.0, 15482.0, 8730.0, 5097.0, 3049.0, 1794.0, 1062.0, 676.0, 412.0, 283.0, 192.0, 123.0, 79.0, 65.0, 37.0, 20.0, 18.0, 13.0, 11.0, 7.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9453125, -12.4908447265625, -12.036376953125, -11.5819091796875, -11.12744140625, -10.6729736328125, -10.218505859375, -9.7640380859375, -9.3095703125, -8.8551025390625, -8.400634765625, -7.9461669921875, -7.49169921875, -7.0372314453125, -6.582763671875, -6.1282958984375, -5.673828125, -5.2193603515625, -4.764892578125, -4.3104248046875, -3.85595703125, -3.4014892578125, -2.947021484375, -2.4925537109375, -2.0380859375, -1.5836181640625, -1.129150390625, -0.6746826171875, -0.22021484375, 0.2342529296875, 0.688720703125, 1.1431884765625, 1.59765625, 2.0521240234375, 2.506591796875, 2.9610595703125, 3.41552734375, 3.8699951171875, 4.324462890625, 4.7789306640625, 5.2333984375, 5.6878662109375, 6.142333984375, 6.5968017578125, 7.05126953125, 7.5057373046875, 7.960205078125, 8.4146728515625, 8.869140625, 9.3236083984375, 9.778076171875, 10.2325439453125, 10.68701171875, 11.1414794921875, 11.595947265625, 12.0504150390625, 12.5048828125, 12.9593505859375, 13.413818359375, 13.8682861328125, 14.32275390625, 14.7772216796875, 15.231689453125, 15.6861572265625, 16.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 5.0, 8.0, 8.0, 9.0, 8.0, 16.0, 17.0, 15.0, 22.0, 33.0, 42.0, 37.0, 56.0, 52.0, 68.0, 75.0, 76.0, 75.0, 62.0, 61.0, 49.0, 41.0, 33.0, 31.0, 18.0, 16.0, 17.0, 13.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012683868408203125, -0.0012215673923492432, -0.0011747479438781738, -0.0011279284954071045, -0.0010811090469360352, -0.0010342895984649658, -0.0009874701499938965, -0.0009406507015228271, -0.0008938312530517578, -0.0008470118045806885, -0.0008001923561096191, -0.0007533729076385498, -0.0007065534591674805, -0.0006597340106964111, -0.0006129145622253418, -0.0005660951137542725, -0.0005192756652832031, -0.0004724562168121338, -0.00042563676834106445, -0.0003788173198699951, -0.0003319978713989258, -0.00028517842292785645, -0.0002383589744567871, -0.00019153952598571777, -0.00014472007751464844, -9.79006290435791e-05, -5.1081180572509766e-05, -4.26173210144043e-06, 4.2557716369628906e-05, 8.937716484069824e-05, 0.00013619661331176758, 0.00018301606178283691, 0.00022983551025390625, 0.0002766549587249756, 0.0003234744071960449, 0.00037029385566711426, 0.0004171133041381836, 0.00046393275260925293, 0.0005107522010803223, 0.0005575716495513916, 0.0006043910980224609, 0.0006512105464935303, 0.0006980299949645996, 0.0007448494434356689, 0.0007916688919067383, 0.0008384883403778076, 0.000885307788848877, 0.0009321272373199463, 0.0009789466857910156, 0.001025766134262085, 0.0010725855827331543, 0.0011194050312042236, 0.001166224479675293, 0.0012130439281463623, 0.0012598633766174316, 0.001306682825088501, 0.0013535022735595703, 0.0014003217220306396, 0.001447141170501709, 0.0014939606189727783, 0.0015407800674438477, 0.001587599515914917, 0.0016344189643859863, 0.0016812384128570557, 0.001728057861328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 3.0, 12.0, 8.0, 8.0, 18.0, 27.0, 28.0, 44.0, 85.0, 130.0, 198.0, 274.0, 434.0, 679.0, 1068.0, 1721.0, 2733.0, 4437.0, 7395.0, 12285.0, 20579.0, 35165.0, 60715.0, 104789.0, 173913.0, 216022.0, 166123.0, 100225.0, 56791.0, 33186.0, 19402.0, 11586.0, 6958.0, 4321.0, 2586.0, 1671.0, 1064.0, 678.0, 425.0, 227.0, 193.0, 116.0, 66.0, 61.0, 46.0, 21.0, 11.0, 13.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9736328125, -10.587890625, -10.2021484375, -9.81640625, -9.4306640625, -9.044921875, -8.6591796875, -8.2734375, -7.8876953125, -7.501953125, -7.1162109375, -6.73046875, -6.3447265625, -5.958984375, -5.5732421875, -5.1875, -4.8017578125, -4.416015625, -4.0302734375, -3.64453125, -3.2587890625, -2.873046875, -2.4873046875, -2.1015625, -1.7158203125, -1.330078125, -0.9443359375, -0.55859375, -0.1728515625, 0.212890625, 0.5986328125, 0.984375, 1.3701171875, 1.755859375, 2.1416015625, 2.52734375, 2.9130859375, 3.298828125, 3.6845703125, 4.0703125, 4.4560546875, 4.841796875, 5.2275390625, 5.61328125, 5.9990234375, 6.384765625, 6.7705078125, 7.15625, 7.5419921875, 7.927734375, 8.3134765625, 8.69921875, 9.0849609375, 9.470703125, 9.8564453125, 10.2421875, 10.6279296875, 11.013671875, 11.3994140625, 11.78515625, 12.1708984375, 12.556640625, 12.9423828125, 13.328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 4.0, 8.0, 4.0, 4.0, 10.0, 6.0, 11.0, 12.0, 24.0, 22.0, 25.0, 17.0, 30.0, 35.0, 39.0, 31.0, 41.0, 45.0, 65.0, 54.0, 64.0, 62.0, 52.0, 45.0, 38.0, 41.0, 39.0, 21.0, 18.0, 23.0, 13.0, 15.0, 15.0, 9.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-3.482421875, -3.3782958984375, -3.274169921875, -3.1700439453125, -3.06591796875, -2.9617919921875, -2.857666015625, -2.7535400390625, -2.6494140625, -2.5452880859375, -2.441162109375, -2.3370361328125, -2.23291015625, -2.1287841796875, -2.024658203125, -1.9205322265625, -1.81640625, -1.7122802734375, -1.608154296875, -1.5040283203125, -1.39990234375, -1.2957763671875, -1.191650390625, -1.0875244140625, -0.9833984375, -0.8792724609375, -0.775146484375, -0.6710205078125, -0.56689453125, -0.4627685546875, -0.358642578125, -0.2545166015625, -0.150390625, -0.0462646484375, 0.057861328125, 0.1619873046875, 0.26611328125, 0.3702392578125, 0.474365234375, 0.5784912109375, 0.6826171875, 0.7867431640625, 0.890869140625, 0.9949951171875, 1.09912109375, 1.2032470703125, 1.307373046875, 1.4114990234375, 1.515625, 1.6197509765625, 1.723876953125, 1.8280029296875, 1.93212890625, 2.0362548828125, 2.140380859375, 2.2445068359375, 2.3486328125, 2.4527587890625, 2.556884765625, 2.6610107421875, 2.76513671875, 2.8692626953125, 2.973388671875, 3.0775146484375, 3.181640625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 10.0, 2.0, 7.0, 13.0, 11.0, 12.0, 13.0, 24.0, 17.0, 23.0, 29.0, 39.0, 40.0, 58.0, 55.0, 57.0, 61.0, 72.0, 48.0, 47.0, 65.0, 43.0, 50.0, 34.0, 28.0, 20.0, 19.0, 16.0, 18.0, 12.0, 9.0, 10.0, 8.0, 5.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.04131317138672, -32.99440383911133, -31.947498321533203, -30.900588989257812, -29.853681564331055, -28.806774139404297, -27.759864807128906, -26.71295738220215, -25.66604995727539, -24.619142532348633, -23.572235107421875, -22.525325775146484, -21.478418350219727, -20.43151092529297, -19.384601593017578, -18.33769416809082, -17.290786743164062, -16.243879318237305, -15.19697093963623, -14.150062561035156, -13.103155136108398, -12.05624771118164, -11.009339332580566, -9.962430953979492, -8.915523529052734, -7.868615627288818, -6.821707725524902, -5.774799823760986, -4.72789192199707, -3.6809840202331543, -2.6340761184692383, -1.5871682167053223, -0.5402565002441406, 0.5066514015197754, 1.5535593032836914, 2.6004672050476074, 3.6473751068115234, 4.6942830085754395, 5.7411909103393555, 6.7880988121032715, 7.8350067138671875, 8.881914138793945, 9.92882251739502, 10.975730895996094, 12.022638320922852, 13.06954574584961, 14.116454124450684, 15.163362503051758, 16.210269927978516, 17.257177352905273, 18.30408477783203, 19.350994110107422, 20.39790153503418, 21.444808959960938, 22.491718292236328, 23.538625717163086, 24.585533142089844, 25.6324405670166, 26.67934799194336, 27.72625732421875, 28.773164749145508, 29.820072174072266, 30.866981506347656, 31.913888931274414, 32.96079635620117]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 5.0, 5.0, 9.0, 9.0, 7.0, 19.0, 13.0, 18.0, 18.0, 15.0, 17.0, 29.0, 27.0, 29.0, 31.0, 20.0, 28.0, 32.0, 26.0, 42.0, 27.0, 17.0, 32.0, 49.0, 33.0, 37.0, 40.0, 23.0, 34.0, 25.0, 24.0, 25.0, 20.0, 30.0, 12.0, 22.0, 20.0, 26.0, 15.0, 15.0, 16.0, 8.0, 9.0, 12.0, 5.0, 1.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0], "bins": [-28.643796920776367, -27.812063217163086, -26.980331420898438, -26.148597717285156, -25.316865921020508, -24.485132217407227, -23.653400421142578, -22.821666717529297, -21.989933013916016, -21.158199310302734, -20.326467514038086, -19.494733810424805, -18.663002014160156, -17.831268310546875, -16.999534606933594, -16.167802810668945, -15.336071014404297, -14.504338264465332, -13.672605514526367, -12.840871810913086, -12.009140014648438, -11.177406311035156, -10.345673561096191, -9.513940811157227, -8.682208061218262, -7.850475311279297, -7.018742561340332, -6.187009334564209, -5.355276584625244, -4.523543834686279, -3.6918106079101562, -2.8600778579711914, -2.0283432006835938, -1.1966103315353394, -0.36487746238708496, 0.466855525970459, 1.2985882759094238, 2.1303210258483887, 2.9620542526245117, 3.7937870025634766, 4.625519752502441, 5.457252502441406, 6.288985252380371, 7.120718479156494, 7.952451229095459, 8.784183502197266, 9.615917205810547, 10.447649955749512, 11.279382705688477, 12.111115455627441, 12.942848205566406, 13.774581909179688, 14.606313705444336, 15.438047409057617, 16.269779205322266, 17.101512908935547, 17.933246612548828, 18.76498031616211, 19.596712112426758, 20.42844581604004, 21.260177612304688, 22.09191131591797, 22.92364501953125, 23.7553768157959, 24.587108612060547]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 15.0, 18.0, 16.0, 32.0, 45.0, 67.0, 97.0, 144.0, 213.0, 315.0, 481.0, 736.0, 1097.0, 1604.0, 2505.0, 3557.0, 5300.0, 8082.0, 12363.0, 20033.0, 32894.0, 58627.0, 120909.0, 315600.0, 795236.0, 1258741.0, 883546.0, 370366.0, 141137.0, 64482.0, 36005.0, 21425.0, 13309.0, 8588.0, 5509.0, 3633.0, 2464.0, 1677.0, 1186.0, 796.0, 487.0, 340.0, 211.0, 141.0, 73.0, 64.0, 42.0, 30.0, 20.0, 11.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-33.6875, -32.62060546875, -31.5537109375, -30.48681640625, -29.419921875, -28.35302734375, -27.2861328125, -26.21923828125, -25.15234375, -24.08544921875, -23.0185546875, -21.95166015625, -20.884765625, -19.81787109375, -18.7509765625, -17.68408203125, -16.6171875, -15.55029296875, -14.4833984375, -13.41650390625, -12.349609375, -11.28271484375, -10.2158203125, -9.14892578125, -8.08203125, -7.01513671875, -5.9482421875, -4.88134765625, -3.814453125, -2.74755859375, -1.6806640625, -0.61376953125, 0.453125, 1.52001953125, 2.5869140625, 3.65380859375, 4.720703125, 5.78759765625, 6.8544921875, 7.92138671875, 8.98828125, 10.05517578125, 11.1220703125, 12.18896484375, 13.255859375, 14.32275390625, 15.3896484375, 16.45654296875, 17.5234375, 18.59033203125, 19.6572265625, 20.72412109375, 21.791015625, 22.85791015625, 23.9248046875, 24.99169921875, 26.05859375, 27.12548828125, 28.1923828125, 29.25927734375, 30.326171875, 31.39306640625, 32.4599609375, 33.52685546875, 34.59375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 7.0, 4.0, 6.0, 6.0, 6.0, 6.0, 15.0, 14.0, 17.0, 23.0, 16.0, 19.0, 25.0, 24.0, 21.0, 29.0, 35.0, 22.0, 38.0, 25.0, 48.0, 28.0, 32.0, 37.0, 38.0, 34.0, 38.0, 34.0, 40.0, 28.0, 23.0, 35.0, 23.0, 26.0, 22.0, 25.0, 21.0, 13.0, 23.0, 7.0, 16.0, 9.0, 10.0, 9.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-25.40625, -24.650146484375, -23.89404296875, -23.137939453125, -22.3818359375, -21.625732421875, -20.86962890625, -20.113525390625, -19.357421875, -18.601318359375, -17.84521484375, -17.089111328125, -16.3330078125, -15.576904296875, -14.82080078125, -14.064697265625, -13.30859375, -12.552490234375, -11.79638671875, -11.040283203125, -10.2841796875, -9.528076171875, -8.77197265625, -8.015869140625, -7.259765625, -6.503662109375, -5.74755859375, -4.991455078125, -4.2353515625, -3.479248046875, -2.72314453125, -1.967041015625, -1.2109375, -0.454833984375, 0.30126953125, 1.057373046875, 1.8134765625, 2.569580078125, 3.32568359375, 4.081787109375, 4.837890625, 5.593994140625, 6.35009765625, 7.106201171875, 7.8623046875, 8.618408203125, 9.37451171875, 10.130615234375, 10.88671875, 11.642822265625, 12.39892578125, 13.155029296875, 13.9111328125, 14.667236328125, 15.42333984375, 16.179443359375, 16.935546875, 17.691650390625, 18.44775390625, 19.203857421875, 19.9599609375, 20.716064453125, 21.47216796875, 22.228271484375, 22.984375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 11.0, 17.0, 27.0, 56.0, 66.0, 103.0, 173.0, 291.0, 470.0, 820.0, 1357.0, 2352.0, 4110.0, 7776.0, 14719.0, 29469.0, 61083.0, 137014.0, 346713.0, 1113030.0, 1634558.0, 497543.0, 184335.0, 80031.0, 37476.0, 18831.0, 9749.0, 5255.0, 2876.0, 1600.0, 905.0, 537.0, 319.0, 223.0, 137.0, 83.0, 57.0, 36.0, 19.0, 19.0, 8.0, 9.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90625, -51.208984375, -49.51171875, -47.814453125, -46.1171875, -44.419921875, -42.72265625, -41.025390625, -39.328125, -37.630859375, -35.93359375, -34.236328125, -32.5390625, -30.841796875, -29.14453125, -27.447265625, -25.75, -24.052734375, -22.35546875, -20.658203125, -18.9609375, -17.263671875, -15.56640625, -13.869140625, -12.171875, -10.474609375, -8.77734375, -7.080078125, -5.3828125, -3.685546875, -1.98828125, -0.291015625, 1.40625, 3.103515625, 4.80078125, 6.498046875, 8.1953125, 9.892578125, 11.58984375, 13.287109375, 14.984375, 16.681640625, 18.37890625, 20.076171875, 21.7734375, 23.470703125, 25.16796875, 26.865234375, 28.5625, 30.259765625, 31.95703125, 33.654296875, 35.3515625, 37.048828125, 38.74609375, 40.443359375, 42.140625, 43.837890625, 45.53515625, 47.232421875, 48.9296875, 50.626953125, 52.32421875, 54.021484375, 55.71875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 6.0, 9.0, 4.0, 4.0, 7.0, 14.0, 23.0, 22.0, 25.0, 31.0, 51.0, 65.0, 91.0, 93.0, 105.0, 125.0, 155.0, 248.0, 289.0, 379.0, 457.0, 374.0, 302.0, 253.0, 200.0, 157.0, 115.0, 90.0, 74.0, 61.0, 61.0, 32.0, 33.0, 32.0, 26.0, 16.0, 10.0, 8.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.8853759765625, -11.419189453125, -10.9530029296875, -10.48681640625, -10.0206298828125, -9.554443359375, -9.0882568359375, -8.6220703125, -8.1558837890625, -7.689697265625, -7.2235107421875, -6.75732421875, -6.2911376953125, -5.824951171875, -5.3587646484375, -4.892578125, -4.4263916015625, -3.960205078125, -3.4940185546875, -3.02783203125, -2.5616455078125, -2.095458984375, -1.6292724609375, -1.1630859375, -0.6968994140625, -0.230712890625, 0.2354736328125, 0.70166015625, 1.1678466796875, 1.634033203125, 2.1002197265625, 2.56640625, 3.0325927734375, 3.498779296875, 3.9649658203125, 4.43115234375, 4.8973388671875, 5.363525390625, 5.8297119140625, 6.2958984375, 6.7620849609375, 7.228271484375, 7.6944580078125, 8.16064453125, 8.6268310546875, 9.093017578125, 9.5592041015625, 10.025390625, 10.4915771484375, 10.957763671875, 11.4239501953125, 11.89013671875, 12.3563232421875, 12.822509765625, 13.2886962890625, 13.7548828125, 14.2210693359375, 14.687255859375, 15.1534423828125, 15.61962890625, 16.0858154296875, 16.552001953125, 17.0181884765625, 17.484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 11.0, 3.0, 14.0, 6.0, 5.0, 14.0, 18.0, 16.0, 24.0, 21.0, 34.0, 31.0, 32.0, 50.0, 49.0, 52.0, 54.0, 72.0, 53.0, 65.0, 59.0, 61.0, 46.0, 42.0, 27.0, 24.0, 17.0, 19.0, 11.0, 12.0, 14.0, 7.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-30.91046142578125, -29.837297439575195, -28.76413345336914, -27.690969467163086, -26.61780548095703, -25.54464340209961, -24.471479415893555, -23.3983154296875, -22.325151443481445, -21.25198745727539, -20.178823471069336, -19.10565948486328, -18.03249740600586, -16.959331512451172, -15.88616943359375, -14.813005447387695, -13.73984146118164, -12.666677474975586, -11.593513488769531, -10.520350456237793, -9.447186470031738, -8.374022483825684, -7.300858974456787, -6.227695465087891, -5.154531478881836, -4.081367492675781, -3.0082039833068848, -1.9350402355194092, -0.8618764877319336, 0.2112874984741211, 1.2844510078430176, 2.357614517211914, 3.4307823181152344, 4.503946304321289, 5.5771098136901855, 6.650273323059082, 7.723437309265137, 8.796601295471191, 9.86976432800293, 10.942928314208984, 12.016092300415039, 13.089256286621094, 14.162420272827148, 15.235583305358887, 16.308746337890625, 17.381912231445312, 18.455074310302734, 19.52823829650879, 20.601402282714844, 21.6745662689209, 22.747730255126953, 23.820894241333008, 24.894058227539062, 25.967220306396484, 27.04038429260254, 28.113548278808594, 29.18671226501465, 30.259876251220703, 31.333040237426758, 32.40620422363281, 33.479366302490234, 34.55253219604492, 35.625694274902344, 36.69886016845703, 37.77202224731445]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 8.0, 7.0, 16.0, 16.0, 18.0, 26.0, 20.0, 18.0, 32.0, 23.0, 33.0, 36.0, 31.0, 36.0, 40.0, 39.0, 37.0, 49.0, 37.0, 36.0, 31.0, 37.0, 36.0, 37.0, 31.0, 36.0, 34.0, 20.0, 30.0, 24.0, 19.0, 13.0, 16.0, 15.0, 13.0, 8.0, 9.0, 2.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.769123077392578, -28.83692741394043, -27.90473175048828, -26.972537994384766, -26.040342330932617, -25.10814666748047, -24.17595100402832, -23.243755340576172, -22.311561584472656, -21.379365921020508, -20.44717025756836, -19.514976501464844, -18.582780838012695, -17.650585174560547, -16.7183895111084, -15.78619384765625, -14.853998184204102, -13.921802520751953, -12.989607810974121, -12.057412147521973, -11.12521743774414, -10.193021774291992, -9.260826110839844, -8.328630447387695, -7.396435737609863, -6.464240550994873, -5.532045364379883, -4.599849700927734, -3.667654514312744, -2.735459327697754, -1.8032636642456055, -0.8710684776306152, 0.06112480163574219, 0.993320107460022, 1.9255154132843018, 2.857710838317871, 3.7899060249328613, 4.722101211547852, 5.654296875, 6.58649206161499, 7.5186872482299805, 8.450882911682129, 9.383077621459961, 10.31527328491211, 11.247468948364258, 12.17966365814209, 13.111859321594238, 14.04405403137207, 14.976249694824219, 15.908445358276367, 16.840641021728516, 17.77283477783203, 18.70503044128418, 19.637226104736328, 20.569421768188477, 21.501617431640625, 22.43381118774414, 23.36600685119629, 24.298202514648438, 25.230396270751953, 26.1625919342041, 27.09478759765625, 28.0269832611084, 28.959178924560547, 29.891374588012695]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 12.0, 13.0, 11.0, 22.0, 39.0, 44.0, 82.0, 108.0, 150.0, 212.0, 312.0, 466.0, 709.0, 1027.0, 1551.0, 2240.0, 3424.0, 5133.0, 7858.0, 12162.0, 19079.0, 29745.0, 48122.0, 78486.0, 127820.0, 192305.0, 189134.0, 123635.0, 75381.0, 46811.0, 29256.0, 18435.0, 11953.0, 7690.0, 5013.0, 3284.0, 2177.0, 1468.0, 995.0, 708.0, 464.0, 338.0, 227.0, 147.0, 89.0, 69.0, 51.0, 26.0, 21.0, 21.0, 9.0, 12.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0], "bins": [-22.9375, -22.219970703125, -21.50244140625, -20.784912109375, -20.0673828125, -19.349853515625, -18.63232421875, -17.914794921875, -17.197265625, -16.479736328125, -15.76220703125, -15.044677734375, -14.3271484375, -13.609619140625, -12.89208984375, -12.174560546875, -11.45703125, -10.739501953125, -10.02197265625, -9.304443359375, -8.5869140625, -7.869384765625, -7.15185546875, -6.434326171875, -5.716796875, -4.999267578125, -4.28173828125, -3.564208984375, -2.8466796875, -2.129150390625, -1.41162109375, -0.694091796875, 0.0234375, 0.740966796875, 1.45849609375, 2.176025390625, 2.8935546875, 3.611083984375, 4.32861328125, 5.046142578125, 5.763671875, 6.481201171875, 7.19873046875, 7.916259765625, 8.6337890625, 9.351318359375, 10.06884765625, 10.786376953125, 11.50390625, 12.221435546875, 12.93896484375, 13.656494140625, 14.3740234375, 15.091552734375, 15.80908203125, 16.526611328125, 17.244140625, 17.961669921875, 18.67919921875, 19.396728515625, 20.1142578125, 20.831787109375, 21.54931640625, 22.266845703125, 22.984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 4.0, 3.0, 7.0, 16.0, 15.0, 16.0, 24.0, 16.0, 26.0, 34.0, 32.0, 24.0, 33.0, 28.0, 39.0, 42.0, 42.0, 40.0, 43.0, 53.0, 39.0, 32.0, 34.0, 33.0, 36.0, 44.0, 36.0, 33.0, 29.0, 26.0, 20.0, 21.0, 10.0, 14.0, 15.0, 10.0, 7.0, 6.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.738037109375, -29.74169921875, -28.745361328125, -27.7490234375, -26.752685546875, -25.75634765625, -24.760009765625, -23.763671875, -22.767333984375, -21.77099609375, -20.774658203125, -19.7783203125, -18.781982421875, -17.78564453125, -16.789306640625, -15.79296875, -14.796630859375, -13.80029296875, -12.803955078125, -11.8076171875, -10.811279296875, -9.81494140625, -8.818603515625, -7.822265625, -6.825927734375, -5.82958984375, -4.833251953125, -3.8369140625, -2.840576171875, -1.84423828125, -0.847900390625, 0.1484375, 1.144775390625, 2.14111328125, 3.137451171875, 4.1337890625, 5.130126953125, 6.12646484375, 7.122802734375, 8.119140625, 9.115478515625, 10.11181640625, 11.108154296875, 12.1044921875, 13.100830078125, 14.09716796875, 15.093505859375, 16.08984375, 17.086181640625, 18.08251953125, 19.078857421875, 20.0751953125, 21.071533203125, 22.06787109375, 23.064208984375, 24.060546875, 25.056884765625, 26.05322265625, 27.049560546875, 28.0458984375, 29.042236328125, 30.03857421875, 31.034912109375, 32.03125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 7.0, 9.0, 12.0, 17.0, 30.0, 29.0, 48.0, 66.0, 101.0, 153.0, 194.0, 287.0, 423.0, 645.0, 984.0, 1592.0, 2490.0, 3977.0, 6738.0, 11371.0, 20600.0, 38926.0, 80717.0, 185181.0, 327926.0, 191314.0, 83592.0, 40478.0, 20975.0, 11687.0, 6741.0, 3978.0, 2531.0, 1638.0, 1026.0, 648.0, 440.0, 292.0, 208.0, 146.0, 104.0, 71.0, 53.0, 28.0, 26.0, 21.0, 11.0, 8.0, 7.0, 4.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -35.84814453125, -34.6337890625, -33.41943359375, -32.205078125, -30.99072265625, -29.7763671875, -28.56201171875, -27.34765625, -26.13330078125, -24.9189453125, -23.70458984375, -22.490234375, -21.27587890625, -20.0615234375, -18.84716796875, -17.6328125, -16.41845703125, -15.2041015625, -13.98974609375, -12.775390625, -11.56103515625, -10.3466796875, -9.13232421875, -7.91796875, -6.70361328125, -5.4892578125, -4.27490234375, -3.060546875, -1.84619140625, -0.6318359375, 0.58251953125, 1.796875, 3.01123046875, 4.2255859375, 5.43994140625, 6.654296875, 7.86865234375, 9.0830078125, 10.29736328125, 11.51171875, 12.72607421875, 13.9404296875, 15.15478515625, 16.369140625, 17.58349609375, 18.7978515625, 20.01220703125, 21.2265625, 22.44091796875, 23.6552734375, 24.86962890625, 26.083984375, 27.29833984375, 28.5126953125, 29.72705078125, 30.94140625, 32.15576171875, 33.3701171875, 34.58447265625, 35.798828125, 37.01318359375, 38.2275390625, 39.44189453125, 40.65625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 8.0, 15.0, 11.0, 15.0, 10.0, 13.0, 24.0, 25.0, 16.0, 27.0, 43.0, 25.0, 36.0, 32.0, 39.0, 39.0, 48.0, 24.0, 34.0, 43.0, 35.0, 39.0, 36.0, 37.0, 44.0, 40.0, 33.0, 32.0, 31.0, 29.0, 18.0, 12.0, 16.0, 11.0, 6.0, 15.0, 6.0, 5.0, 9.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.578125, -20.93798828125, -20.2978515625, -19.65771484375, -19.017578125, -18.37744140625, -17.7373046875, -17.09716796875, -16.45703125, -15.81689453125, -15.1767578125, -14.53662109375, -13.896484375, -13.25634765625, -12.6162109375, -11.97607421875, -11.3359375, -10.69580078125, -10.0556640625, -9.41552734375, -8.775390625, -8.13525390625, -7.4951171875, -6.85498046875, -6.21484375, -5.57470703125, -4.9345703125, -4.29443359375, -3.654296875, -3.01416015625, -2.3740234375, -1.73388671875, -1.09375, -0.45361328125, 0.1865234375, 0.82666015625, 1.466796875, 2.10693359375, 2.7470703125, 3.38720703125, 4.02734375, 4.66748046875, 5.3076171875, 5.94775390625, 6.587890625, 7.22802734375, 7.8681640625, 8.50830078125, 9.1484375, 9.78857421875, 10.4287109375, 11.06884765625, 11.708984375, 12.34912109375, 12.9892578125, 13.62939453125, 14.26953125, 14.90966796875, 15.5498046875, 16.18994140625, 16.830078125, 17.47021484375, 18.1103515625, 18.75048828125, 19.390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 11.0, 16.0, 30.0, 33.0, 46.0, 58.0, 102.0, 133.0, 184.0, 300.0, 436.0, 713.0, 1143.0, 1894.0, 3376.0, 6278.0, 12230.0, 27807.0, 77434.0, 286475.0, 435226.0, 120734.0, 39262.0, 16287.0, 7794.0, 4218.0, 2442.0, 1354.0, 849.0, 555.0, 361.0, 225.0, 165.0, 104.0, 58.0, 57.0, 33.0, 26.0, 18.0, 19.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.6484375, -15.1466064453125, -14.644775390625, -14.1429443359375, -13.64111328125, -13.1392822265625, -12.637451171875, -12.1356201171875, -11.6337890625, -11.1319580078125, -10.630126953125, -10.1282958984375, -9.62646484375, -9.1246337890625, -8.622802734375, -8.1209716796875, -7.619140625, -7.1173095703125, -6.615478515625, -6.1136474609375, -5.61181640625, -5.1099853515625, -4.608154296875, -4.1063232421875, -3.6044921875, -3.1026611328125, -2.600830078125, -2.0989990234375, -1.59716796875, -1.0953369140625, -0.593505859375, -0.0916748046875, 0.41015625, 0.9119873046875, 1.413818359375, 1.9156494140625, 2.41748046875, 2.9193115234375, 3.421142578125, 3.9229736328125, 4.4248046875, 4.9266357421875, 5.428466796875, 5.9302978515625, 6.43212890625, 6.9339599609375, 7.435791015625, 7.9376220703125, 8.439453125, 8.9412841796875, 9.443115234375, 9.9449462890625, 10.44677734375, 10.9486083984375, 11.450439453125, 11.9522705078125, 12.4541015625, 12.9559326171875, 13.457763671875, 13.9595947265625, 14.46142578125, 14.9632568359375, 15.465087890625, 15.9669189453125, 16.46875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 15.0, 14.0, 18.0, 35.0, 41.0, 81.0, 87.0, 148.0, 159.0, 115.0, 96.0, 56.0, 37.0, 27.0, 19.0, 13.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018739700317382812, -0.0018118172883987427, -0.001749664545059204, -0.0016875118017196655, -0.001625359058380127, -0.0015632063150405884, -0.0015010535717010498, -0.0014389008283615112, -0.0013767480850219727, -0.001314595341682434, -0.0012524425983428955, -0.001190289855003357, -0.0011281371116638184, -0.0010659843683242798, -0.0010038316249847412, -0.0009416788816452026, -0.0008795261383056641, -0.0008173733949661255, -0.0007552206516265869, -0.0006930679082870483, -0.0006309151649475098, -0.0005687624216079712, -0.0005066096782684326, -0.00044445693492889404, -0.00038230419158935547, -0.0003201514482498169, -0.0002579987049102783, -0.00019584596157073975, -0.00013369321823120117, -7.15404748916626e-05, -9.387731552124023e-06, 5.276501178741455e-05, 0.00011491775512695312, 0.0001770704984664917, 0.00023922324180603027, 0.00030137598514556885, 0.0003635287284851074, 0.000425681471824646, 0.00048783421516418457, 0.0005499869585037231, 0.0006121397018432617, 0.0006742924451828003, 0.0007364451885223389, 0.0007985979318618774, 0.000860750675201416, 0.0009229034185409546, 0.0009850561618804932, 0.0010472089052200317, 0.0011093616485595703, 0.0011715143918991089, 0.0012336671352386475, 0.001295819878578186, 0.0013579726219177246, 0.0014201253652572632, 0.0014822781085968018, 0.0015444308519363403, 0.001606583595275879, 0.0016687363386154175, 0.001730889081954956, 0.0017930418252944946, 0.0018551945686340332, 0.0019173473119735718, 0.0019795000553131104, 0.002041652798652649, 0.0021038055419921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 10.0, 18.0, 21.0, 29.0, 45.0, 79.0, 119.0, 134.0, 208.0, 363.0, 427.0, 713.0, 1147.0, 1743.0, 2782.0, 4729.0, 7822.0, 14249.0, 27808.0, 60494.0, 153811.0, 334810.0, 250617.0, 98027.0, 41014.0, 20323.0, 10889.0, 6058.0, 3624.0, 2217.0, 1441.0, 892.0, 603.0, 412.0, 286.0, 174.0, 129.0, 86.0, 62.0, 41.0, 22.0, 25.0, 17.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-15.21875, -14.781005859375, -14.34326171875, -13.905517578125, -13.4677734375, -13.030029296875, -12.59228515625, -12.154541015625, -11.716796875, -11.279052734375, -10.84130859375, -10.403564453125, -9.9658203125, -9.528076171875, -9.09033203125, -8.652587890625, -8.21484375, -7.777099609375, -7.33935546875, -6.901611328125, -6.4638671875, -6.026123046875, -5.58837890625, -5.150634765625, -4.712890625, -4.275146484375, -3.83740234375, -3.399658203125, -2.9619140625, -2.524169921875, -2.08642578125, -1.648681640625, -1.2109375, -0.773193359375, -0.33544921875, 0.102294921875, 0.5400390625, 0.977783203125, 1.41552734375, 1.853271484375, 2.291015625, 2.728759765625, 3.16650390625, 3.604248046875, 4.0419921875, 4.479736328125, 4.91748046875, 5.355224609375, 5.79296875, 6.230712890625, 6.66845703125, 7.106201171875, 7.5439453125, 7.981689453125, 8.41943359375, 8.857177734375, 9.294921875, 9.732666015625, 10.17041015625, 10.608154296875, 11.0458984375, 11.483642578125, 11.92138671875, 12.359130859375, 12.796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 7.0, 7.0, 5.0, 7.0, 7.0, 15.0, 16.0, 25.0, 24.0, 34.0, 52.0, 79.0, 63.0, 86.0, 71.0, 88.0, 82.0, 74.0, 61.0, 36.0, 21.0, 28.0, 24.0, 13.0, 11.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4296875, -4.284912109375, -4.14013671875, -3.995361328125, -3.8505859375, -3.705810546875, -3.56103515625, -3.416259765625, -3.271484375, -3.126708984375, -2.98193359375, -2.837158203125, -2.6923828125, -2.547607421875, -2.40283203125, -2.258056640625, -2.11328125, -1.968505859375, -1.82373046875, -1.678955078125, -1.5341796875, -1.389404296875, -1.24462890625, -1.099853515625, -0.955078125, -0.810302734375, -0.66552734375, -0.520751953125, -0.3759765625, -0.231201171875, -0.08642578125, 0.058349609375, 0.203125, 0.347900390625, 0.49267578125, 0.637451171875, 0.7822265625, 0.927001953125, 1.07177734375, 1.216552734375, 1.361328125, 1.506103515625, 1.65087890625, 1.795654296875, 1.9404296875, 2.085205078125, 2.22998046875, 2.374755859375, 2.51953125, 2.664306640625, 2.80908203125, 2.953857421875, 3.0986328125, 3.243408203125, 3.38818359375, 3.532958984375, 3.677734375, 3.822509765625, 3.96728515625, 4.112060546875, 4.2568359375, 4.401611328125, 4.54638671875, 4.691162109375, 4.8359375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 8.0, 10.0, 7.0, 9.0, 12.0, 15.0, 21.0, 16.0, 23.0, 32.0, 22.0, 34.0, 32.0, 47.0, 54.0, 65.0, 61.0, 70.0, 51.0, 64.0, 43.0, 49.0, 41.0, 37.0, 30.0, 22.0, 23.0, 16.0, 17.0, 9.0, 12.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.662500381469727, -27.651273727416992, -26.64004898071289, -25.628822326660156, -24.617595672607422, -23.606369018554688, -22.595144271850586, -21.58391761779785, -20.57269287109375, -19.561466217041016, -18.550241470336914, -17.53901481628418, -16.527788162231445, -15.516562461853027, -14.50533676147461, -13.494110107421875, -12.48288345336914, -11.471657752990723, -10.460431098937988, -9.44920539855957, -8.437978744506836, -7.426753044128418, -6.41552734375, -5.404301166534424, -4.393074989318848, -3.3818488121032715, -2.3706228733062744, -1.3593969345092773, -0.34817075729370117, 0.663055419921875, 1.674281120300293, 2.685507297515869, 3.696735382080078, 4.707961559295654, 5.7191877365112305, 6.730413436889648, 7.741639614105225, 8.7528657913208, 9.764091491699219, 10.775318145751953, 11.786543846130371, 12.797769546508789, 13.808996200561523, 14.820221900939941, 15.83144760131836, 16.842674255371094, 17.853900909423828, 18.86512565612793, 19.876352310180664, 20.8875789642334, 21.8988037109375, 22.910030364990234, 23.92125701904297, 24.932483673095703, 25.943708419799805, 26.95493507385254, 27.96615982055664, 28.977386474609375, 29.988611221313477, 30.99983787536621, 32.01106262207031, 33.02228927612305, 34.03351593017578, 35.044742584228516, 36.05596923828125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 4.0, 10.0, 8.0, 14.0, 20.0, 23.0, 23.0, 25.0, 23.0, 30.0, 26.0, 27.0, 35.0, 35.0, 43.0, 27.0, 47.0, 38.0, 40.0, 40.0, 30.0, 39.0, 34.0, 42.0, 32.0, 35.0, 36.0, 23.0, 25.0, 32.0, 25.0, 10.0, 16.0, 11.0, 16.0, 12.0, 11.0, 6.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-29.438772201538086, -28.533864974975586, -27.628957748413086, -26.724050521850586, -25.819143295288086, -24.914236068725586, -24.009328842163086, -23.104421615600586, -22.199514389038086, -21.294607162475586, -20.389699935913086, -19.484792709350586, -18.579885482788086, -17.674978256225586, -16.770071029663086, -15.865163803100586, -14.96025562286377, -14.05534839630127, -13.15044116973877, -12.24553394317627, -11.34062671661377, -10.435718536376953, -9.530811309814453, -8.625904083251953, -7.720997333526611, -6.816090106964111, -5.911182880401611, -5.006275177001953, -4.101367950439453, -3.196460723876953, -2.291553497314453, -1.3866462707519531, -0.4817390441894531, 0.42316824197769165, 1.3280755281448364, 2.232982873916626, 3.137890100479126, 4.042797565460205, 4.947704792022705, 5.852612018585205, 6.757519245147705, 7.662426471710205, 8.567334175109863, 9.472241401672363, 10.377148628234863, 11.282055854797363, 12.186963081359863, 13.091870307922363, 13.996777534484863, 14.901684761047363, 15.806591987609863, 16.71150016784668, 17.61640739440918, 18.52131462097168, 19.42622184753418, 20.33112907409668, 21.23603630065918, 22.14094352722168, 23.04585075378418, 23.95075798034668, 24.85566520690918, 25.76057243347168, 26.66547966003418, 27.57038688659668, 28.47529411315918]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 13.0, 13.0, 18.0, 46.0, 56.0, 94.0, 118.0, 212.0, 264.0, 460.0, 700.0, 1208.0, 1735.0, 2766.0, 4426.0, 6932.0, 11013.0, 17526.0, 28044.0, 45617.0, 72881.0, 115724.0, 169015.0, 187846.0, 140297.0, 91082.0, 55964.0, 35287.0, 21762.0, 13875.0, 8596.0, 5464.0, 3345.0, 2179.0, 1433.0, 923.0, 568.0, 380.0, 215.0, 152.0, 99.0, 82.0, 50.0, 24.0, 17.0, 10.0, 9.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.71875, -33.6416015625, -32.564453125, -31.4873046875, -30.41015625, -29.3330078125, -28.255859375, -27.1787109375, -26.1015625, -25.0244140625, -23.947265625, -22.8701171875, -21.79296875, -20.7158203125, -19.638671875, -18.5615234375, -17.484375, -16.4072265625, -15.330078125, -14.2529296875, -13.17578125, -12.0986328125, -11.021484375, -9.9443359375, -8.8671875, -7.7900390625, -6.712890625, -5.6357421875, -4.55859375, -3.4814453125, -2.404296875, -1.3271484375, -0.25, 0.8271484375, 1.904296875, 2.9814453125, 4.05859375, 5.1357421875, 6.212890625, 7.2900390625, 8.3671875, 9.4443359375, 10.521484375, 11.5986328125, 12.67578125, 13.7529296875, 14.830078125, 15.9072265625, 16.984375, 18.0615234375, 19.138671875, 20.2158203125, 21.29296875, 22.3701171875, 23.447265625, 24.5244140625, 25.6015625, 26.6787109375, 27.755859375, 28.8330078125, 29.91015625, 30.9873046875, 32.064453125, 33.1416015625, 34.21875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 13.0, 6.0, 9.0, 5.0, 13.0, 15.0, 25.0, 26.0, 14.0, 24.0, 29.0, 25.0, 28.0, 36.0, 41.0, 41.0, 30.0, 31.0, 31.0, 45.0, 51.0, 40.0, 36.0, 31.0, 36.0, 36.0, 46.0, 30.0, 33.0, 22.0, 24.0, 26.0, 19.0, 13.0, 19.0, 16.0, 12.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-31.234375, -30.31689453125, -29.3994140625, -28.48193359375, -27.564453125, -26.64697265625, -25.7294921875, -24.81201171875, -23.89453125, -22.97705078125, -22.0595703125, -21.14208984375, -20.224609375, -19.30712890625, -18.3896484375, -17.47216796875, -16.5546875, -15.63720703125, -14.7197265625, -13.80224609375, -12.884765625, -11.96728515625, -11.0498046875, -10.13232421875, -9.21484375, -8.29736328125, -7.3798828125, -6.46240234375, -5.544921875, -4.62744140625, -3.7099609375, -2.79248046875, -1.875, -0.95751953125, -0.0400390625, 0.87744140625, 1.794921875, 2.71240234375, 3.6298828125, 4.54736328125, 5.46484375, 6.38232421875, 7.2998046875, 8.21728515625, 9.134765625, 10.05224609375, 10.9697265625, 11.88720703125, 12.8046875, 13.72216796875, 14.6396484375, 15.55712890625, 16.474609375, 17.39208984375, 18.3095703125, 19.22705078125, 20.14453125, 21.06201171875, 21.9794921875, 22.89697265625, 23.814453125, 24.73193359375, 25.6494140625, 26.56689453125, 27.484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 11.0, 22.0, 26.0, 34.0, 62.0, 101.0, 139.0, 271.0, 411.0, 708.0, 1132.0, 2097.0, 3602.0, 6459.0, 11792.0, 22277.0, 42685.0, 86421.0, 174303.0, 278965.0, 205499.0, 103223.0, 51100.0, 25981.0, 13821.0, 7483.0, 4117.0, 2372.0, 1388.0, 839.0, 453.0, 262.0, 189.0, 104.0, 80.0, 43.0, 28.0, 18.0, 18.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.46875, -47.853515625, -46.23828125, -44.623046875, -43.0078125, -41.392578125, -39.77734375, -38.162109375, -36.546875, -34.931640625, -33.31640625, -31.701171875, -30.0859375, -28.470703125, -26.85546875, -25.240234375, -23.625, -22.009765625, -20.39453125, -18.779296875, -17.1640625, -15.548828125, -13.93359375, -12.318359375, -10.703125, -9.087890625, -7.47265625, -5.857421875, -4.2421875, -2.626953125, -1.01171875, 0.603515625, 2.21875, 3.833984375, 5.44921875, 7.064453125, 8.6796875, 10.294921875, 11.91015625, 13.525390625, 15.140625, 16.755859375, 18.37109375, 19.986328125, 21.6015625, 23.216796875, 24.83203125, 26.447265625, 28.0625, 29.677734375, 31.29296875, 32.908203125, 34.5234375, 36.138671875, 37.75390625, 39.369140625, 40.984375, 42.599609375, 44.21484375, 45.830078125, 47.4453125, 49.060546875, 50.67578125, 52.291015625, 53.90625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 2.0, 2.0, 9.0, 7.0, 18.0, 13.0, 16.0, 11.0, 23.0, 25.0, 20.0, 31.0, 38.0, 32.0, 35.0, 37.0, 59.0, 52.0, 41.0, 40.0, 53.0, 38.0, 46.0, 49.0, 32.0, 34.0, 35.0, 36.0, 20.0, 16.0, 21.0, 23.0, 17.0, 12.0, 15.0, 12.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.890625, -20.250732421875, -19.61083984375, -18.970947265625, -18.3310546875, -17.691162109375, -17.05126953125, -16.411376953125, -15.771484375, -15.131591796875, -14.49169921875, -13.851806640625, -13.2119140625, -12.572021484375, -11.93212890625, -11.292236328125, -10.65234375, -10.012451171875, -9.37255859375, -8.732666015625, -8.0927734375, -7.452880859375, -6.81298828125, -6.173095703125, -5.533203125, -4.893310546875, -4.25341796875, -3.613525390625, -2.9736328125, -2.333740234375, -1.69384765625, -1.053955078125, -0.4140625, 0.225830078125, 0.86572265625, 1.505615234375, 2.1455078125, 2.785400390625, 3.42529296875, 4.065185546875, 4.705078125, 5.344970703125, 5.98486328125, 6.624755859375, 7.2646484375, 7.904541015625, 8.54443359375, 9.184326171875, 9.82421875, 10.464111328125, 11.10400390625, 11.743896484375, 12.3837890625, 13.023681640625, 13.66357421875, 14.303466796875, 14.943359375, 15.583251953125, 16.22314453125, 16.863037109375, 17.5029296875, 18.142822265625, 18.78271484375, 19.422607421875, 20.0625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 11.0, 11.0, 18.0, 26.0, 26.0, 33.0, 54.0, 78.0, 94.0, 117.0, 171.0, 260.0, 353.0, 507.0, 740.0, 1143.0, 1831.0, 3001.0, 5140.0, 9083.0, 18024.0, 37542.0, 85294.0, 206669.0, 336021.0, 190600.0, 78129.0, 34960.0, 16904.0, 8737.0, 4892.0, 2818.0, 1760.0, 1064.0, 706.0, 507.0, 355.0, 244.0, 174.0, 116.0, 105.0, 60.0, 45.0, 37.0, 36.0, 15.0, 11.0, 14.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.59375, -19.91748046875, -19.2412109375, -18.56494140625, -17.888671875, -17.21240234375, -16.5361328125, -15.85986328125, -15.18359375, -14.50732421875, -13.8310546875, -13.15478515625, -12.478515625, -11.80224609375, -11.1259765625, -10.44970703125, -9.7734375, -9.09716796875, -8.4208984375, -7.74462890625, -7.068359375, -6.39208984375, -5.7158203125, -5.03955078125, -4.36328125, -3.68701171875, -3.0107421875, -2.33447265625, -1.658203125, -0.98193359375, -0.3056640625, 0.37060546875, 1.046875, 1.72314453125, 2.3994140625, 3.07568359375, 3.751953125, 4.42822265625, 5.1044921875, 5.78076171875, 6.45703125, 7.13330078125, 7.8095703125, 8.48583984375, 9.162109375, 9.83837890625, 10.5146484375, 11.19091796875, 11.8671875, 12.54345703125, 13.2197265625, 13.89599609375, 14.572265625, 15.24853515625, 15.9248046875, 16.60107421875, 17.27734375, 17.95361328125, 18.6298828125, 19.30615234375, 19.982421875, 20.65869140625, 21.3349609375, 22.01123046875, 22.6875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 10.0, 16.0, 26.0, 33.0, 60.0, 78.0, 90.0, 137.0, 126.0, 108.0, 80.0, 66.0, 36.0, 38.0, 11.0, 19.0, 11.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0028972625732421875, -0.0028096139430999756, -0.0027219653129577637, -0.0026343166828155518, -0.00254666805267334, -0.002459019422531128, -0.002371370792388916, -0.002283722162246704, -0.002196073532104492, -0.0021084249019622803, -0.0020207762718200684, -0.0019331276416778564, -0.0018454790115356445, -0.0017578303813934326, -0.0016701817512512207, -0.0015825331211090088, -0.0014948844909667969, -0.001407235860824585, -0.001319587230682373, -0.0012319386005401611, -0.0011442899703979492, -0.0010566413402557373, -0.0009689927101135254, -0.0008813440799713135, -0.0007936954498291016, -0.0007060468196868896, -0.0006183981895446777, -0.0005307495594024658, -0.0004431009292602539, -0.000355452299118042, -0.0002678036689758301, -0.00018015503883361816, -9.250640869140625e-05, -4.857778549194336e-06, 8.279085159301758e-05, 0.0001704394817352295, 0.0002580881118774414, 0.0003457367420196533, 0.00043338537216186523, 0.0005210340023040771, 0.0006086826324462891, 0.000696331262588501, 0.0007839798927307129, 0.0008716285228729248, 0.0009592771530151367, 0.0010469257831573486, 0.0011345744132995605, 0.0012222230434417725, 0.0013098716735839844, 0.0013975203037261963, 0.0014851689338684082, 0.0015728175640106201, 0.001660466194152832, 0.001748114824295044, 0.0018357634544372559, 0.0019234120845794678, 0.0020110607147216797, 0.0020987093448638916, 0.0021863579750061035, 0.0022740066051483154, 0.0023616552352905273, 0.0024493038654327393, 0.002536952495574951, 0.002624601125717163, 0.002712249755859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 16.0, 33.0, 28.0, 38.0, 52.0, 97.0, 146.0, 250.0, 419.0, 661.0, 1118.0, 1947.0, 3390.0, 6399.0, 12480.0, 26415.0, 58982.0, 137365.0, 289205.0, 276118.0, 127457.0, 55422.0, 24742.0, 11874.0, 6008.0, 3260.0, 1867.0, 1044.0, 612.0, 379.0, 219.0, 156.0, 100.0, 77.0, 43.0, 33.0, 17.0, 13.0, 12.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.828125, -19.166259765625, -18.50439453125, -17.842529296875, -17.1806640625, -16.518798828125, -15.85693359375, -15.195068359375, -14.533203125, -13.871337890625, -13.20947265625, -12.547607421875, -11.8857421875, -11.223876953125, -10.56201171875, -9.900146484375, -9.23828125, -8.576416015625, -7.91455078125, -7.252685546875, -6.5908203125, -5.928955078125, -5.26708984375, -4.605224609375, -3.943359375, -3.281494140625, -2.61962890625, -1.957763671875, -1.2958984375, -0.634033203125, 0.02783203125, 0.689697265625, 1.3515625, 2.013427734375, 2.67529296875, 3.337158203125, 3.9990234375, 4.660888671875, 5.32275390625, 5.984619140625, 6.646484375, 7.308349609375, 7.97021484375, 8.632080078125, 9.2939453125, 9.955810546875, 10.61767578125, 11.279541015625, 11.94140625, 12.603271484375, 13.26513671875, 13.927001953125, 14.5888671875, 15.250732421875, 15.91259765625, 16.574462890625, 17.236328125, 17.898193359375, 18.56005859375, 19.221923828125, 19.8837890625, 20.545654296875, 21.20751953125, 21.869384765625, 22.53125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 7.0, 16.0, 16.0, 17.0, 32.0, 32.0, 35.0, 50.0, 50.0, 66.0, 56.0, 71.0, 79.0, 83.0, 84.0, 57.0, 46.0, 41.0, 32.0, 34.0, 17.0, 13.0, 12.0, 13.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.22869873046875, -4.0355224609375, -3.84234619140625, -3.649169921875, -3.45599365234375, -3.2628173828125, -3.06964111328125, -2.87646484375, -2.68328857421875, -2.4901123046875, -2.29693603515625, -2.103759765625, -1.91058349609375, -1.7174072265625, -1.52423095703125, -1.3310546875, -1.13787841796875, -0.9447021484375, -0.75152587890625, -0.558349609375, -0.36517333984375, -0.1719970703125, 0.02117919921875, 0.21435546875, 0.40753173828125, 0.6007080078125, 0.79388427734375, 0.987060546875, 1.18023681640625, 1.3734130859375, 1.56658935546875, 1.759765625, 1.95294189453125, 2.1461181640625, 2.33929443359375, 2.532470703125, 2.72564697265625, 2.9188232421875, 3.11199951171875, 3.30517578125, 3.49835205078125, 3.6915283203125, 3.88470458984375, 4.077880859375, 4.27105712890625, 4.4642333984375, 4.65740966796875, 4.8505859375, 5.04376220703125, 5.2369384765625, 5.43011474609375, 5.623291015625, 5.81646728515625, 6.0096435546875, 6.20281982421875, 6.39599609375, 6.58917236328125, 6.7823486328125, 6.97552490234375, 7.168701171875, 7.36187744140625, 7.5550537109375, 7.74822998046875, 7.94140625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 6.0, 11.0, 5.0, 9.0, 15.0, 20.0, 16.0, 18.0, 30.0, 33.0, 28.0, 41.0, 35.0, 50.0, 45.0, 59.0, 47.0, 49.0, 53.0, 48.0, 64.0, 43.0, 38.0, 43.0, 27.0, 20.0, 19.0, 18.0, 16.0, 22.0, 16.0, 6.0, 5.0, 8.0, 7.0, 3.0, 2.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0], "bins": [-28.101316452026367, -27.175453186035156, -26.249591827392578, -25.323728561401367, -24.397865295410156, -23.472002029418945, -22.546138763427734, -21.620277404785156, -20.694414138793945, -19.768550872802734, -18.842689514160156, -17.916826248168945, -16.990962982177734, -16.065099716186523, -15.139237403869629, -14.213375091552734, -13.287511825561523, -12.361648559570312, -11.435786247253418, -10.509923934936523, -9.584060668945312, -8.658197402954102, -7.732335090637207, -6.806472301483154, -5.880609512329102, -4.954746723175049, -4.028883934020996, -3.1030211448669434, -2.1771583557128906, -1.251295566558838, -0.32543277740478516, 0.6004300117492676, 1.5262908935546875, 2.4521536827087402, 3.378016471862793, 4.303879261016846, 5.229742050170898, 6.155604839324951, 7.081467628479004, 8.007329940795898, 8.93319320678711, 9.85905647277832, 10.784918785095215, 11.71078109741211, 12.63664436340332, 13.562507629394531, 14.488369941711426, 15.41423225402832, 16.34009552001953, 17.265958786010742, 18.191822052001953, 19.11768341064453, 20.043546676635742, 20.969409942626953, 21.89527130126953, 22.821134567260742, 23.746997833251953, 24.672861099243164, 25.598724365234375, 26.524585723876953, 27.450448989868164, 28.376312255859375, 29.302173614501953, 30.228036880493164, 31.153900146484375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 5.0, 11.0, 10.0, 7.0, 19.0, 15.0, 22.0, 17.0, 20.0, 21.0, 26.0, 27.0, 33.0, 35.0, 38.0, 34.0, 30.0, 39.0, 40.0, 28.0, 30.0, 30.0, 36.0, 25.0, 31.0, 40.0, 29.0, 28.0, 35.0, 30.0, 29.0, 27.0, 17.0, 17.0, 17.0, 16.0, 12.0, 6.0, 7.0, 12.0, 5.0, 9.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0], "bins": [-28.420991897583008, -27.608470916748047, -26.795949935913086, -25.983428955078125, -25.170909881591797, -24.358386993408203, -23.545867919921875, -22.733346939086914, -21.920825958251953, -21.108304977416992, -20.29578399658203, -19.48326301574707, -18.67074203491211, -17.85822296142578, -17.04570198059082, -16.23318099975586, -15.420660018920898, -14.608139038085938, -13.795618057250977, -12.983098030090332, -12.170577049255371, -11.35805606842041, -10.545536041259766, -9.733015060424805, -8.920494079589844, -8.107973098754883, -7.29545259475708, -6.482932090759277, -5.670411109924316, -4.8578901290893555, -4.045369625091553, -3.23284912109375, -2.4203262329101562, -1.6078054904937744, -0.7952847480773926, 0.017235994338989258, 0.8297567367553711, 1.642277717590332, 2.4547982215881348, 3.2673187255859375, 4.079839706420898, 4.892360687255859, 5.704881191253662, 6.517401695251465, 7.329922676086426, 8.142443656921387, 8.954963684082031, 9.767484664916992, 10.580005645751953, 11.392526626586914, 12.205047607421875, 13.01756763458252, 13.83008861541748, 14.642609596252441, 15.455129623413086, 16.267650604248047, 17.080171585083008, 17.89269256591797, 18.70521354675293, 19.51773452758789, 20.33025360107422, 21.142776489257812, 21.95529556274414, 22.7678165435791, 23.580337524414062]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 9.0, 7.0, 9.0, 10.0, 14.0, 24.0, 38.0, 45.0, 51.0, 89.0, 155.0, 182.0, 314.0, 412.0, 578.0, 899.0, 1249.0, 1954.0, 2973.0, 4645.0, 6920.0, 10970.0, 17514.0, 29326.0, 52229.0, 108345.0, 295432.0, 852505.0, 1386435.0, 847479.0, 320843.0, 119100.0, 56137.0, 30531.0, 17605.0, 10655.0, 6609.0, 4254.0, 2650.0, 1786.0, 1109.0, 750.0, 483.0, 328.0, 230.0, 147.0, 100.0, 42.0, 44.0, 28.0, 20.0, 13.0, 12.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-38.5625, -37.4453125, -36.328125, -35.2109375, -34.09375, -32.9765625, -31.859375, -30.7421875, -29.625, -28.5078125, -27.390625, -26.2734375, -25.15625, -24.0390625, -22.921875, -21.8046875, -20.6875, -19.5703125, -18.453125, -17.3359375, -16.21875, -15.1015625, -13.984375, -12.8671875, -11.75, -10.6328125, -9.515625, -8.3984375, -7.28125, -6.1640625, -5.046875, -3.9296875, -2.8125, -1.6953125, -0.578125, 0.5390625, 1.65625, 2.7734375, 3.890625, 5.0078125, 6.125, 7.2421875, 8.359375, 9.4765625, 10.59375, 11.7109375, 12.828125, 13.9453125, 15.0625, 16.1796875, 17.296875, 18.4140625, 19.53125, 20.6484375, 21.765625, 22.8828125, 24.0, 25.1171875, 26.234375, 27.3515625, 28.46875, 29.5859375, 30.703125, 31.8203125, 32.9375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 6.0, 8.0, 5.0, 10.0, 10.0, 12.0, 18.0, 12.0, 13.0, 12.0, 21.0, 24.0, 30.0, 15.0, 27.0, 29.0, 39.0, 29.0, 37.0, 30.0, 38.0, 39.0, 40.0, 25.0, 40.0, 32.0, 42.0, 45.0, 39.0, 24.0, 30.0, 33.0, 28.0, 29.0, 14.0, 17.0, 12.0, 11.0, 18.0, 18.0, 7.0, 5.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-25.671875, -24.945556640625, -24.21923828125, -23.492919921875, -22.7666015625, -22.040283203125, -21.31396484375, -20.587646484375, -19.861328125, -19.135009765625, -18.40869140625, -17.682373046875, -16.9560546875, -16.229736328125, -15.50341796875, -14.777099609375, -14.05078125, -13.324462890625, -12.59814453125, -11.871826171875, -11.1455078125, -10.419189453125, -9.69287109375, -8.966552734375, -8.240234375, -7.513916015625, -6.78759765625, -6.061279296875, -5.3349609375, -4.608642578125, -3.88232421875, -3.156005859375, -2.4296875, -1.703369140625, -0.97705078125, -0.250732421875, 0.4755859375, 1.201904296875, 1.92822265625, 2.654541015625, 3.380859375, 4.107177734375, 4.83349609375, 5.559814453125, 6.2861328125, 7.012451171875, 7.73876953125, 8.465087890625, 9.19140625, 9.917724609375, 10.64404296875, 11.370361328125, 12.0966796875, 12.822998046875, 13.54931640625, 14.275634765625, 15.001953125, 15.728271484375, 16.45458984375, 17.180908203125, 17.9072265625, 18.633544921875, 19.35986328125, 20.086181640625, 20.8125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 1.0, 21.0, 33.0, 35.0, 38.0, 64.0, 98.0, 159.0, 226.0, 372.0, 508.0, 879.0, 1303.0, 2175.0, 3481.0, 5669.0, 10039.0, 17643.0, 32848.0, 62899.0, 128569.0, 293018.0, 771625.0, 1628720.0, 708548.0, 271835.0, 121760.0, 59737.0, 30933.0, 16951.0, 9594.0, 5520.0, 3315.0, 2060.0, 1298.0, 781.0, 509.0, 322.0, 235.0, 159.0, 101.0, 77.0, 44.0, 22.0, 22.0, 12.0, 4.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.09375, -39.74462890625, -38.3955078125, -37.04638671875, -35.697265625, -34.34814453125, -32.9990234375, -31.64990234375, -30.30078125, -28.95166015625, -27.6025390625, -26.25341796875, -24.904296875, -23.55517578125, -22.2060546875, -20.85693359375, -19.5078125, -18.15869140625, -16.8095703125, -15.46044921875, -14.111328125, -12.76220703125, -11.4130859375, -10.06396484375, -8.71484375, -7.36572265625, -6.0166015625, -4.66748046875, -3.318359375, -1.96923828125, -0.6201171875, 0.72900390625, 2.078125, 3.42724609375, 4.7763671875, 6.12548828125, 7.474609375, 8.82373046875, 10.1728515625, 11.52197265625, 12.87109375, 14.22021484375, 15.5693359375, 16.91845703125, 18.267578125, 19.61669921875, 20.9658203125, 22.31494140625, 23.6640625, 25.01318359375, 26.3623046875, 27.71142578125, 29.060546875, 30.40966796875, 31.7587890625, 33.10791015625, 34.45703125, 35.80615234375, 37.1552734375, 38.50439453125, 39.853515625, 41.20263671875, 42.5517578125, 43.90087890625, 45.25]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 5.0, 9.0, 12.0, 23.0, 30.0, 29.0, 46.0, 41.0, 48.0, 83.0, 96.0, 139.0, 183.0, 247.0, 341.0, 416.0, 466.0, 431.0, 334.0, 267.0, 181.0, 169.0, 107.0, 92.0, 63.0, 56.0, 39.0, 32.0, 24.0, 16.0, 11.0, 16.0, 3.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.466552734375, -11.97998046875, -11.493408203125, -11.0068359375, -10.520263671875, -10.03369140625, -9.547119140625, -9.060546875, -8.573974609375, -8.08740234375, -7.600830078125, -7.1142578125, -6.627685546875, -6.14111328125, -5.654541015625, -5.16796875, -4.681396484375, -4.19482421875, -3.708251953125, -3.2216796875, -2.735107421875, -2.24853515625, -1.761962890625, -1.275390625, -0.788818359375, -0.30224609375, 0.184326171875, 0.6708984375, 1.157470703125, 1.64404296875, 2.130615234375, 2.6171875, 3.103759765625, 3.59033203125, 4.076904296875, 4.5634765625, 5.050048828125, 5.53662109375, 6.023193359375, 6.509765625, 6.996337890625, 7.48291015625, 7.969482421875, 8.4560546875, 8.942626953125, 9.42919921875, 9.915771484375, 10.40234375, 10.888916015625, 11.37548828125, 11.862060546875, 12.3486328125, 12.835205078125, 13.32177734375, 13.808349609375, 14.294921875, 14.781494140625, 15.26806640625, 15.754638671875, 16.2412109375, 16.727783203125, 17.21435546875, 17.700927734375, 18.1875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 6.0, 13.0, 8.0, 19.0, 24.0, 26.0, 35.0, 39.0, 45.0, 54.0, 76.0, 62.0, 67.0, 82.0, 69.0, 73.0, 60.0, 43.0, 32.0, 29.0, 31.0, 15.0, 17.0, 16.0, 7.0, 12.0, 5.0, 5.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-43.4337272644043, -42.22896194458008, -41.024200439453125, -39.819435119628906, -38.61466979980469, -37.40990447998047, -36.20513916015625, -35.0003776550293, -33.79561233520508, -32.59084701538086, -31.386083602905273, -30.181320190429688, -28.97655487060547, -27.77178955078125, -26.567026138305664, -25.362262725830078, -24.15749740600586, -22.95273208618164, -21.747968673706055, -20.54320526123047, -19.33843994140625, -18.13367462158203, -16.928911209106445, -15.724146842956543, -14.51938247680664, -13.314618110656738, -12.109853744506836, -10.905089378356934, -9.700325012207031, -8.495560646057129, -7.290796279907227, -6.086031913757324, -4.8812713623046875, -3.676506996154785, -2.471742630004883, -1.2669782638549805, -0.062213897705078125, 1.1425504684448242, 2.3473148345947266, 3.552079200744629, 4.756843566894531, 5.961607933044434, 7.166372299194336, 8.371136665344238, 9.57590103149414, 10.780665397644043, 11.985429763793945, 13.190194129943848, 14.39495849609375, 15.599722862243652, 16.804487228393555, 18.00925064086914, 19.21401596069336, 20.418781280517578, 21.623544692993164, 22.82830810546875, 24.03307342529297, 25.237838745117188, 26.442602157592773, 27.64736557006836, 28.852130889892578, 30.056896209716797, 31.261659622192383, 32.46642303466797, 33.67118835449219]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 15.0, 9.0, 8.0, 10.0, 17.0, 18.0, 16.0, 14.0, 23.0, 23.0, 23.0, 26.0, 34.0, 30.0, 37.0, 37.0, 44.0, 41.0, 41.0, 33.0, 51.0, 34.0, 37.0, 36.0, 35.0, 35.0, 25.0, 35.0, 29.0, 19.0, 15.0, 21.0, 22.0, 22.0, 12.0, 16.0, 8.0, 10.0, 8.0, 7.0, 6.0, 5.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.403141021728516, -27.558950424194336, -26.714757919311523, -25.870567321777344, -25.026376724243164, -24.182186126708984, -23.337993621826172, -22.493803024291992, -21.649612426757812, -20.805421829223633, -19.96122932434082, -19.11703872680664, -18.27284812927246, -17.42865753173828, -16.58446502685547, -15.740274429321289, -14.896081924438477, -14.05189037322998, -13.2076997756958, -12.363508224487305, -11.519317626953125, -10.675126075744629, -9.830934524536133, -8.986743927001953, -8.142552375793457, -7.298361301422119, -6.454170227050781, -5.609978675842285, -4.765787601470947, -3.9215965270996094, -3.0774049758911133, -2.2332139015197754, -1.3890228271484375, -0.5448316335678101, 0.2993595600128174, 1.1435508728027344, 1.9877419471740723, 2.83193302154541, 3.6761245727539062, 4.520315647125244, 5.364506721496582, 6.20869779586792, 7.052888870239258, 7.897080421447754, 8.74127197265625, 9.58546257019043, 10.429654121398926, 11.273845672607422, 12.118036270141602, 12.962227821350098, 13.806418418884277, 14.650609970092773, 15.494800567626953, 16.338993072509766, 17.183183670043945, 18.027374267578125, 18.871566772460938, 19.715757369995117, 20.55994987487793, 21.40414047241211, 22.24833106994629, 23.09252166748047, 23.93671417236328, 24.78090476989746, 25.62509536743164]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 9.0, 11.0, 27.0, 30.0, 45.0, 62.0, 93.0, 143.0, 210.0, 359.0, 516.0, 911.0, 1582.0, 2843.0, 4881.0, 8905.0, 16162.0, 30746.0, 59894.0, 127007.0, 271466.0, 268490.0, 127189.0, 59912.0, 30562.0, 16110.0, 8726.0, 4836.0, 2793.0, 1533.0, 949.0, 558.0, 335.0, 216.0, 134.0, 102.0, 70.0, 37.0, 23.0, 22.0, 16.0, 16.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -27.927490234375, -26.96435546875, -26.001220703125, -25.0380859375, -24.074951171875, -23.11181640625, -22.148681640625, -21.185546875, -20.222412109375, -19.25927734375, -18.296142578125, -17.3330078125, -16.369873046875, -15.40673828125, -14.443603515625, -13.48046875, -12.517333984375, -11.55419921875, -10.591064453125, -9.6279296875, -8.664794921875, -7.70166015625, -6.738525390625, -5.775390625, -4.812255859375, -3.84912109375, -2.885986328125, -1.9228515625, -0.959716796875, 0.00341796875, 0.966552734375, 1.9296875, 2.892822265625, 3.85595703125, 4.819091796875, 5.7822265625, 6.745361328125, 7.70849609375, 8.671630859375, 9.634765625, 10.597900390625, 11.56103515625, 12.524169921875, 13.4873046875, 14.450439453125, 15.41357421875, 16.376708984375, 17.33984375, 18.302978515625, 19.26611328125, 20.229248046875, 21.1923828125, 22.155517578125, 23.11865234375, 24.081787109375, 25.044921875, 26.008056640625, 26.97119140625, 27.934326171875, 28.8974609375, 29.860595703125, 30.82373046875, 31.786865234375, 32.75]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 7.0, 6.0, 13.0, 17.0, 14.0, 20.0, 7.0, 16.0, 19.0, 26.0, 26.0, 25.0, 34.0, 35.0, 43.0, 31.0, 33.0, 44.0, 46.0, 34.0, 43.0, 41.0, 30.0, 40.0, 35.0, 24.0, 34.0, 29.0, 30.0, 28.0, 16.0, 16.0, 19.0, 15.0, 15.0, 13.0, 19.0, 12.0, 4.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.25, -27.404052734375, -26.55810546875, -25.712158203125, -24.8662109375, -24.020263671875, -23.17431640625, -22.328369140625, -21.482421875, -20.636474609375, -19.79052734375, -18.944580078125, -18.0986328125, -17.252685546875, -16.40673828125, -15.560791015625, -14.71484375, -13.868896484375, -13.02294921875, -12.177001953125, -11.3310546875, -10.485107421875, -9.63916015625, -8.793212890625, -7.947265625, -7.101318359375, -6.25537109375, -5.409423828125, -4.5634765625, -3.717529296875, -2.87158203125, -2.025634765625, -1.1796875, -0.333740234375, 0.51220703125, 1.358154296875, 2.2041015625, 3.050048828125, 3.89599609375, 4.741943359375, 5.587890625, 6.433837890625, 7.27978515625, 8.125732421875, 8.9716796875, 9.817626953125, 10.66357421875, 11.509521484375, 12.35546875, 13.201416015625, 14.04736328125, 14.893310546875, 15.7392578125, 16.585205078125, 17.43115234375, 18.277099609375, 19.123046875, 19.968994140625, 20.81494140625, 21.660888671875, 22.5068359375, 23.352783203125, 24.19873046875, 25.044677734375, 25.890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 8.0, 9.0, 18.0, 35.0, 58.0, 62.0, 100.0, 155.0, 197.0, 352.0, 550.0, 901.0, 1409.0, 2295.0, 3898.0, 6346.0, 11108.0, 20127.0, 39549.0, 87323.0, 226993.0, 363424.0, 152195.0, 63045.0, 30192.0, 15956.0, 8876.0, 5144.0, 3067.0, 1914.0, 1175.0, 754.0, 426.0, 313.0, 199.0, 117.0, 82.0, 55.0, 44.0, 32.0, 20.0, 8.0, 7.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40625, -37.21728515625, -36.0283203125, -34.83935546875, -33.650390625, -32.46142578125, -31.2724609375, -30.08349609375, -28.89453125, -27.70556640625, -26.5166015625, -25.32763671875, -24.138671875, -22.94970703125, -21.7607421875, -20.57177734375, -19.3828125, -18.19384765625, -17.0048828125, -15.81591796875, -14.626953125, -13.43798828125, -12.2490234375, -11.06005859375, -9.87109375, -8.68212890625, -7.4931640625, -6.30419921875, -5.115234375, -3.92626953125, -2.7373046875, -1.54833984375, -0.359375, 0.82958984375, 2.0185546875, 3.20751953125, 4.396484375, 5.58544921875, 6.7744140625, 7.96337890625, 9.15234375, 10.34130859375, 11.5302734375, 12.71923828125, 13.908203125, 15.09716796875, 16.2861328125, 17.47509765625, 18.6640625, 19.85302734375, 21.0419921875, 22.23095703125, 23.419921875, 24.60888671875, 25.7978515625, 26.98681640625, 28.17578125, 29.36474609375, 30.5537109375, 31.74267578125, 32.931640625, 34.12060546875, 35.3095703125, 36.49853515625, 37.6875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 3.0, 8.0, 9.0, 13.0, 19.0, 14.0, 18.0, 21.0, 20.0, 26.0, 33.0, 28.0, 39.0, 38.0, 43.0, 51.0, 46.0, 49.0, 41.0, 44.0, 37.0, 46.0, 35.0, 43.0, 43.0, 32.0, 25.0, 18.0, 29.0, 21.0, 24.0, 15.0, 7.0, 10.0, 9.0, 5.0, 9.0, 4.0, 1.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -20.0712890625, -19.439453125, -18.8076171875, -18.17578125, -17.5439453125, -16.912109375, -16.2802734375, -15.6484375, -15.0166015625, -14.384765625, -13.7529296875, -13.12109375, -12.4892578125, -11.857421875, -11.2255859375, -10.59375, -9.9619140625, -9.330078125, -8.6982421875, -8.06640625, -7.4345703125, -6.802734375, -6.1708984375, -5.5390625, -4.9072265625, -4.275390625, -3.6435546875, -3.01171875, -2.3798828125, -1.748046875, -1.1162109375, -0.484375, 0.1474609375, 0.779296875, 1.4111328125, 2.04296875, 2.6748046875, 3.306640625, 3.9384765625, 4.5703125, 5.2021484375, 5.833984375, 6.4658203125, 7.09765625, 7.7294921875, 8.361328125, 8.9931640625, 9.625, 10.2568359375, 10.888671875, 11.5205078125, 12.15234375, 12.7841796875, 13.416015625, 14.0478515625, 14.6796875, 15.3115234375, 15.943359375, 16.5751953125, 17.20703125, 17.8388671875, 18.470703125, 19.1025390625, 19.734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 12.0, 9.0, 15.0, 27.0, 36.0, 43.0, 51.0, 87.0, 104.0, 173.0, 254.0, 364.0, 545.0, 845.0, 1400.0, 2192.0, 3773.0, 6596.0, 12241.0, 25278.0, 56288.0, 133764.0, 308554.0, 279554.0, 117789.0, 49360.0, 22486.0, 11294.0, 6004.0, 3468.0, 2095.0, 1365.0, 819.0, 564.0, 373.0, 219.0, 148.0, 104.0, 65.0, 58.0, 33.0, 27.0, 18.0, 13.0, 14.0, 8.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0], "bins": [-10.2734375, -9.96142578125, -9.6494140625, -9.33740234375, -9.025390625, -8.71337890625, -8.4013671875, -8.08935546875, -7.77734375, -7.46533203125, -7.1533203125, -6.84130859375, -6.529296875, -6.21728515625, -5.9052734375, -5.59326171875, -5.28125, -4.96923828125, -4.6572265625, -4.34521484375, -4.033203125, -3.72119140625, -3.4091796875, -3.09716796875, -2.78515625, -2.47314453125, -2.1611328125, -1.84912109375, -1.537109375, -1.22509765625, -0.9130859375, -0.60107421875, -0.2890625, 0.02294921875, 0.3349609375, 0.64697265625, 0.958984375, 1.27099609375, 1.5830078125, 1.89501953125, 2.20703125, 2.51904296875, 2.8310546875, 3.14306640625, 3.455078125, 3.76708984375, 4.0791015625, 4.39111328125, 4.703125, 5.01513671875, 5.3271484375, 5.63916015625, 5.951171875, 6.26318359375, 6.5751953125, 6.88720703125, 7.19921875, 7.51123046875, 7.8232421875, 8.13525390625, 8.447265625, 8.75927734375, 9.0712890625, 9.38330078125, 9.6953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 9.0, 11.0, 22.0, 32.0, 29.0, 30.0, 39.0, 51.0, 67.0, 59.0, 75.0, 67.0, 64.0, 58.0, 63.0, 58.0, 43.0, 34.0, 29.0, 26.0, 25.0, 19.0, 18.0, 7.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006732940673828125, -0.0006482452154159546, -0.0006231963634490967, -0.0005981475114822388, -0.0005730986595153809, -0.000548049807548523, -0.000523000955581665, -0.0004979521036148071, -0.0004729032516479492, -0.0004478543996810913, -0.0004228055477142334, -0.0003977566957473755, -0.0003727078437805176, -0.00034765899181365967, -0.00032261013984680176, -0.00029756128787994385, -0.00027251243591308594, -0.00024746358394622803, -0.00022241473197937012, -0.0001973658800125122, -0.0001723170280456543, -0.0001472681760787964, -0.00012221932411193848, -9.717047214508057e-05, -7.212162017822266e-05, -4.7072768211364746e-05, -2.2023916244506836e-05, 3.0249357223510742e-06, 2.8073787689208984e-05, 5.3122639656066895e-05, 7.81714916229248e-05, 0.00010322034358978271, 0.00012826919555664062, 0.00015331804752349854, 0.00017836689949035645, 0.00020341575145721436, 0.00022846460342407227, 0.0002535134553909302, 0.0002785623073577881, 0.000303611159324646, 0.0003286600112915039, 0.0003537088632583618, 0.0003787577152252197, 0.00040380656719207764, 0.00042885541915893555, 0.00045390427112579346, 0.00047895312309265137, 0.0005040019750595093, 0.0005290508270263672, 0.0005540996789932251, 0.000579148530960083, 0.0006041973829269409, 0.0006292462348937988, 0.0006542950868606567, 0.0006793439388275146, 0.0007043927907943726, 0.0007294416427612305, 0.0007544904947280884, 0.0007795393466949463, 0.0008045881986618042, 0.0008296370506286621, 0.00085468590259552, 0.0008797347545623779, 0.0009047836065292358, 0.0009298324584960938]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 7.0, 8.0, 10.0, 26.0, 24.0, 36.0, 49.0, 60.0, 103.0, 155.0, 228.0, 315.0, 487.0, 802.0, 1391.0, 2262.0, 4103.0, 7155.0, 13721.0, 27192.0, 56831.0, 132686.0, 284589.0, 277865.0, 127116.0, 55081.0, 26162.0, 13188.0, 7107.0, 3941.0, 2298.0, 1318.0, 761.0, 459.0, 310.0, 231.0, 143.0, 97.0, 71.0, 37.0, 42.0, 25.0, 19.0, 8.0, 14.0, 11.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.1314697265625, -10.747314453125, -10.3631591796875, -9.97900390625, -9.5948486328125, -9.210693359375, -8.8265380859375, -8.4423828125, -8.0582275390625, -7.674072265625, -7.2899169921875, -6.90576171875, -6.5216064453125, -6.137451171875, -5.7532958984375, -5.369140625, -4.9849853515625, -4.600830078125, -4.2166748046875, -3.83251953125, -3.4483642578125, -3.064208984375, -2.6800537109375, -2.2958984375, -1.9117431640625, -1.527587890625, -1.1434326171875, -0.75927734375, -0.3751220703125, 0.009033203125, 0.3931884765625, 0.77734375, 1.1614990234375, 1.545654296875, 1.9298095703125, 2.31396484375, 2.6981201171875, 3.082275390625, 3.4664306640625, 3.8505859375, 4.2347412109375, 4.618896484375, 5.0030517578125, 5.38720703125, 5.7713623046875, 6.155517578125, 6.5396728515625, 6.923828125, 7.3079833984375, 7.692138671875, 8.0762939453125, 8.46044921875, 8.8446044921875, 9.228759765625, 9.6129150390625, 9.9970703125, 10.3812255859375, 10.765380859375, 11.1495361328125, 11.53369140625, 11.9178466796875, 12.302001953125, 12.6861572265625, 13.0703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 10.0, 7.0, 8.0, 12.0, 7.0, 16.0, 26.0, 23.0, 18.0, 25.0, 44.0, 59.0, 48.0, 67.0, 85.0, 61.0, 74.0, 84.0, 52.0, 43.0, 30.0, 41.0, 33.0, 17.0, 23.0, 12.0, 16.0, 11.0, 8.0, 6.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7421875, -3.6197509765625, -3.497314453125, -3.3748779296875, -3.25244140625, -3.1300048828125, -3.007568359375, -2.8851318359375, -2.7626953125, -2.6402587890625, -2.517822265625, -2.3953857421875, -2.27294921875, -2.1505126953125, -2.028076171875, -1.9056396484375, -1.783203125, -1.6607666015625, -1.538330078125, -1.4158935546875, -1.29345703125, -1.1710205078125, -1.048583984375, -0.9261474609375, -0.8037109375, -0.6812744140625, -0.558837890625, -0.4364013671875, -0.31396484375, -0.1915283203125, -0.069091796875, 0.0533447265625, 0.17578125, 0.2982177734375, 0.420654296875, 0.5430908203125, 0.66552734375, 0.7879638671875, 0.910400390625, 1.0328369140625, 1.1552734375, 1.2777099609375, 1.400146484375, 1.5225830078125, 1.64501953125, 1.7674560546875, 1.889892578125, 2.0123291015625, 2.134765625, 2.2572021484375, 2.379638671875, 2.5020751953125, 2.62451171875, 2.7469482421875, 2.869384765625, 2.9918212890625, 3.1142578125, 3.2366943359375, 3.359130859375, 3.4815673828125, 3.60400390625, 3.7264404296875, 3.848876953125, 3.9713134765625, 4.09375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 12.0, 16.0, 13.0, 20.0, 24.0, 33.0, 39.0, 33.0, 57.0, 62.0, 73.0, 64.0, 79.0, 70.0, 71.0, 76.0, 45.0, 31.0, 39.0, 22.0, 17.0, 16.0, 20.0, 12.0, 9.0, 7.0, 6.0, 1.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.1654167175293, -42.00754928588867, -40.84968185424805, -39.69181442260742, -38.53395080566406, -37.37608337402344, -36.21821594238281, -35.06034851074219, -33.90248107910156, -32.74461364746094, -31.586746215820312, -30.42888069152832, -29.271013259887695, -28.11314582824707, -26.955280303955078, -25.797412872314453, -24.639545440673828, -23.481678009033203, -22.323810577392578, -21.165945053100586, -20.00807762145996, -18.850210189819336, -17.692344665527344, -16.53447723388672, -15.376609802246094, -14.218742370605469, -13.06087589263916, -11.903009414672852, -10.745141983032227, -9.587274551391602, -8.429408073425293, -7.271541595458984, -6.113676071166992, -4.955809116363525, -3.7979421615600586, -2.640075206756592, -1.482208251953125, -0.3243412971496582, 0.8335256576538086, 1.9913921356201172, 3.149259567260742, 4.307126522064209, 5.464993476867676, 6.622860431671143, 7.780727386474609, 8.938594818115234, 10.096461296081543, 11.254327774047852, 12.412195205688477, 13.570062637329102, 14.72792911529541, 15.885795593261719, 17.043663024902344, 18.20153045654297, 19.359397888183594, 20.517263412475586, 21.67513084411621, 22.832998275756836, 23.990863800048828, 25.148731231689453, 26.306598663330078, 27.464466094970703, 28.622333526611328, 29.78019905090332, 30.938066482543945]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 8.0, 7.0, 7.0, 17.0, 12.0, 17.0, 20.0, 21.0, 17.0, 22.0, 17.0, 26.0, 32.0, 35.0, 35.0, 40.0, 31.0, 44.0, 47.0, 29.0, 42.0, 45.0, 39.0, 44.0, 37.0, 33.0, 22.0, 29.0, 28.0, 18.0, 21.0, 20.0, 20.0, 24.0, 13.0, 14.0, 11.0, 10.0, 9.0, 5.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.629261016845703, -25.817188262939453, -25.005117416381836, -24.193044662475586, -23.380971908569336, -22.56890106201172, -21.75682830810547, -20.94475555419922, -20.13268280029297, -19.32061004638672, -18.5085391998291, -17.69646644592285, -16.8843936920166, -16.072322845458984, -15.260250091552734, -14.448177337646484, -13.636106491088867, -12.824034690856934, -12.011961936950684, -11.19989013671875, -10.3878173828125, -9.575745582580566, -8.763673782348633, -7.951601505279541, -7.139529228210449, -6.327456951141357, -5.515384674072266, -4.703312873840332, -3.8912405967712402, -3.0791683197021484, -2.267096519470215, -1.455024242401123, -0.6429519653320312, 0.169120192527771, 0.9811923503875732, 1.793264389038086, 2.6053366661071777, 3.4174089431762695, 4.229480743408203, 5.041553020477295, 5.853625297546387, 6.6656975746154785, 7.47776985168457, 8.289841651916504, 9.101913452148438, 9.913986206054688, 10.726058006286621, 11.538129806518555, 12.350202560424805, 13.162274360656738, 13.974347114562988, 14.786418914794922, 15.598491668701172, 16.410564422607422, 17.22263526916504, 18.03470802307129, 18.846778869628906, 19.658851623535156, 20.470922470092773, 21.282995223999023, 22.095067977905273, 22.90713882446289, 23.71921157836914, 24.53128433227539, 25.34335708618164]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 7.0, 26.0, 29.0, 46.0, 66.0, 94.0, 103.0, 193.0, 275.0, 418.0, 595.0, 867.0, 1227.0, 1786.0, 2693.0, 3842.0, 5901.0, 8841.0, 13363.0, 20522.0, 31955.0, 49995.0, 79080.0, 121049.0, 167738.0, 172279.0, 128502.0, 84280.0, 53910.0, 34106.0, 21931.0, 14165.0, 9448.0, 6216.0, 4192.0, 2840.0, 1916.0, 1252.0, 872.0, 614.0, 428.0, 273.0, 184.0, 155.0, 73.0, 70.0, 44.0, 27.0, 21.0, 12.0, 8.0, 6.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-28.625, -27.703857421875, -26.78271484375, -25.861572265625, -24.9404296875, -24.019287109375, -23.09814453125, -22.177001953125, -21.255859375, -20.334716796875, -19.41357421875, -18.492431640625, -17.5712890625, -16.650146484375, -15.72900390625, -14.807861328125, -13.88671875, -12.965576171875, -12.04443359375, -11.123291015625, -10.2021484375, -9.281005859375, -8.35986328125, -7.438720703125, -6.517578125, -5.596435546875, -4.67529296875, -3.754150390625, -2.8330078125, -1.911865234375, -0.99072265625, -0.069580078125, 0.8515625, 1.772705078125, 2.69384765625, 3.614990234375, 4.5361328125, 5.457275390625, 6.37841796875, 7.299560546875, 8.220703125, 9.141845703125, 10.06298828125, 10.984130859375, 11.9052734375, 12.826416015625, 13.74755859375, 14.668701171875, 15.58984375, 16.510986328125, 17.43212890625, 18.353271484375, 19.2744140625, 20.195556640625, 21.11669921875, 22.037841796875, 22.958984375, 23.880126953125, 24.80126953125, 25.722412109375, 26.6435546875, 27.564697265625, 28.48583984375, 29.406982421875, 30.328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 7.0, 3.0, 9.0, 8.0, 13.0, 14.0, 18.0, 14.0, 14.0, 16.0, 30.0, 21.0, 28.0, 31.0, 41.0, 35.0, 34.0, 27.0, 43.0, 41.0, 46.0, 30.0, 51.0, 48.0, 32.0, 36.0, 37.0, 29.0, 28.0, 21.0, 24.0, 19.0, 21.0, 23.0, 16.0, 20.0, 13.0, 12.0, 12.0, 11.0, 3.0, 7.0, 1.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.671875, -25.84326171875, -25.0146484375, -24.18603515625, -23.357421875, -22.52880859375, -21.7001953125, -20.87158203125, -20.04296875, -19.21435546875, -18.3857421875, -17.55712890625, -16.728515625, -15.89990234375, -15.0712890625, -14.24267578125, -13.4140625, -12.58544921875, -11.7568359375, -10.92822265625, -10.099609375, -9.27099609375, -8.4423828125, -7.61376953125, -6.78515625, -5.95654296875, -5.1279296875, -4.29931640625, -3.470703125, -2.64208984375, -1.8134765625, -0.98486328125, -0.15625, 0.67236328125, 1.5009765625, 2.32958984375, 3.158203125, 3.98681640625, 4.8154296875, 5.64404296875, 6.47265625, 7.30126953125, 8.1298828125, 8.95849609375, 9.787109375, 10.61572265625, 11.4443359375, 12.27294921875, 13.1015625, 13.93017578125, 14.7587890625, 15.58740234375, 16.416015625, 17.24462890625, 18.0732421875, 18.90185546875, 19.73046875, 20.55908203125, 21.3876953125, 22.21630859375, 23.044921875, 23.87353515625, 24.7021484375, 25.53076171875, 26.359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 10.0, 8.0, 18.0, 15.0, 38.0, 42.0, 73.0, 131.0, 223.0, 293.0, 510.0, 806.0, 1214.0, 1953.0, 2997.0, 4762.0, 7716.0, 12501.0, 20206.0, 33788.0, 58153.0, 101080.0, 168514.0, 218334.0, 168854.0, 101090.0, 57975.0, 33532.0, 20255.0, 12409.0, 7718.0, 4829.0, 3123.0, 2021.0, 1237.0, 783.0, 449.0, 351.0, 193.0, 156.0, 73.0, 48.0, 33.0, 20.0, 10.0, 11.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.53125, -36.37646484375, -35.2216796875, -34.06689453125, -32.912109375, -31.75732421875, -30.6025390625, -29.44775390625, -28.29296875, -27.13818359375, -25.9833984375, -24.82861328125, -23.673828125, -22.51904296875, -21.3642578125, -20.20947265625, -19.0546875, -17.89990234375, -16.7451171875, -15.59033203125, -14.435546875, -13.28076171875, -12.1259765625, -10.97119140625, -9.81640625, -8.66162109375, -7.5068359375, -6.35205078125, -5.197265625, -4.04248046875, -2.8876953125, -1.73291015625, -0.578125, 0.57666015625, 1.7314453125, 2.88623046875, 4.041015625, 5.19580078125, 6.3505859375, 7.50537109375, 8.66015625, 9.81494140625, 10.9697265625, 12.12451171875, 13.279296875, 14.43408203125, 15.5888671875, 16.74365234375, 17.8984375, 19.05322265625, 20.2080078125, 21.36279296875, 22.517578125, 23.67236328125, 24.8271484375, 25.98193359375, 27.13671875, 28.29150390625, 29.4462890625, 30.60107421875, 31.755859375, 32.91064453125, 34.0654296875, 35.22021484375, 36.375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 5.0, 7.0, 7.0, 8.0, 8.0, 7.0, 16.0, 21.0, 19.0, 11.0, 18.0, 18.0, 26.0, 23.0, 25.0, 25.0, 42.0, 26.0, 41.0, 39.0, 35.0, 47.0, 36.0, 38.0, 46.0, 43.0, 28.0, 37.0, 35.0, 39.0, 29.0, 32.0, 29.0, 12.0, 16.0, 20.0, 20.0, 14.0, 9.0, 15.0, 8.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.75, -17.2158203125, -16.681640625, -16.1474609375, -15.61328125, -15.0791015625, -14.544921875, -14.0107421875, -13.4765625, -12.9423828125, -12.408203125, -11.8740234375, -11.33984375, -10.8056640625, -10.271484375, -9.7373046875, -9.203125, -8.6689453125, -8.134765625, -7.6005859375, -7.06640625, -6.5322265625, -5.998046875, -5.4638671875, -4.9296875, -4.3955078125, -3.861328125, -3.3271484375, -2.79296875, -2.2587890625, -1.724609375, -1.1904296875, -0.65625, -0.1220703125, 0.412109375, 0.9462890625, 1.48046875, 2.0146484375, 2.548828125, 3.0830078125, 3.6171875, 4.1513671875, 4.685546875, 5.2197265625, 5.75390625, 6.2880859375, 6.822265625, 7.3564453125, 7.890625, 8.4248046875, 8.958984375, 9.4931640625, 10.02734375, 10.5615234375, 11.095703125, 11.6298828125, 12.1640625, 12.6982421875, 13.232421875, 13.7666015625, 14.30078125, 14.8349609375, 15.369140625, 15.9033203125, 16.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 15.0, 15.0, 29.0, 30.0, 48.0, 65.0, 105.0, 156.0, 208.0, 327.0, 494.0, 727.0, 1156.0, 1781.0, 2919.0, 4789.0, 7852.0, 13825.0, 25051.0, 46071.0, 89734.0, 172152.0, 259253.0, 196347.0, 103955.0, 53728.0, 28562.0, 15783.0, 9036.0, 5321.0, 3257.0, 2043.0, 1243.0, 818.0, 540.0, 357.0, 228.0, 157.0, 107.0, 78.0, 46.0, 42.0, 29.0, 19.0, 16.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-13.296875, -12.88916015625, -12.4814453125, -12.07373046875, -11.666015625, -11.25830078125, -10.8505859375, -10.44287109375, -10.03515625, -9.62744140625, -9.2197265625, -8.81201171875, -8.404296875, -7.99658203125, -7.5888671875, -7.18115234375, -6.7734375, -6.36572265625, -5.9580078125, -5.55029296875, -5.142578125, -4.73486328125, -4.3271484375, -3.91943359375, -3.51171875, -3.10400390625, -2.6962890625, -2.28857421875, -1.880859375, -1.47314453125, -1.0654296875, -0.65771484375, -0.25, 0.15771484375, 0.5654296875, 0.97314453125, 1.380859375, 1.78857421875, 2.1962890625, 2.60400390625, 3.01171875, 3.41943359375, 3.8271484375, 4.23486328125, 4.642578125, 5.05029296875, 5.4580078125, 5.86572265625, 6.2734375, 6.68115234375, 7.0888671875, 7.49658203125, 7.904296875, 8.31201171875, 8.7197265625, 9.12744140625, 9.53515625, 9.94287109375, 10.3505859375, 10.75830078125, 11.166015625, 11.57373046875, 11.9814453125, 12.38916015625, 12.796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 9.0, 10.0, 12.0, 12.0, 15.0, 25.0, 37.0, 52.0, 88.0, 96.0, 128.0, 113.0, 112.0, 87.0, 59.0, 45.0, 27.0, 18.0, 18.0, 12.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017309188842773438, -0.0016647130250930786, -0.0015985071659088135, -0.0015323013067245483, -0.0014660954475402832, -0.001399889588356018, -0.001333683729171753, -0.0012674778699874878, -0.0012012720108032227, -0.0011350661516189575, -0.0010688602924346924, -0.0010026544332504272, -0.0009364485740661621, -0.000870242714881897, -0.0008040368556976318, -0.0007378309965133667, -0.0006716251373291016, -0.0006054192781448364, -0.0005392134189605713, -0.00047300755977630615, -0.000406801700592041, -0.0003405958414077759, -0.00027438998222351074, -0.0002081841230392456, -0.00014197826385498047, -7.577240467071533e-05, -9.566545486450195e-06, 5.663931369781494e-05, 0.00012284517288208008, 0.00018905103206634521, 0.00025525689125061035, 0.0003214627504348755, 0.0003876686096191406, 0.00045387446880340576, 0.0005200803279876709, 0.000586286187171936, 0.0006524920463562012, 0.0007186979055404663, 0.0007849037647247314, 0.0008511096239089966, 0.0009173154830932617, 0.0009835213422775269, 0.001049727201461792, 0.0011159330606460571, 0.0011821389198303223, 0.0012483447790145874, 0.0013145506381988525, 0.0013807564973831177, 0.0014469623565673828, 0.001513168215751648, 0.001579374074935913, 0.0016455799341201782, 0.0017117857933044434, 0.0017779916524887085, 0.0018441975116729736, 0.0019104033708572388, 0.001976609230041504, 0.002042815089225769, 0.002109020948410034, 0.0021752268075942993, 0.0022414326667785645, 0.0023076385259628296, 0.0023738443851470947, 0.00244005024433136, 0.002506256103515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 7.0, 9.0, 16.0, 20.0, 32.0, 45.0, 55.0, 71.0, 96.0, 143.0, 188.0, 267.0, 403.0, 527.0, 760.0, 1043.0, 1682.0, 2420.0, 3479.0, 5413.0, 8295.0, 13206.0, 21171.0, 35188.0, 58665.0, 99786.0, 165383.0, 215301.0, 163863.0, 99056.0, 58414.0, 34835.0, 21127.0, 13155.0, 8088.0, 5241.0, 3455.0, 2332.0, 1590.0, 1065.0, 795.0, 548.0, 359.0, 269.0, 198.0, 138.0, 106.0, 75.0, 62.0, 33.0, 28.0, 23.0, 13.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-10.8515625, -10.5069580078125, -10.162353515625, -9.8177490234375, -9.47314453125, -9.1285400390625, -8.783935546875, -8.4393310546875, -8.0947265625, -7.7501220703125, -7.405517578125, -7.0609130859375, -6.71630859375, -6.3717041015625, -6.027099609375, -5.6824951171875, -5.337890625, -4.9932861328125, -4.648681640625, -4.3040771484375, -3.95947265625, -3.6148681640625, -3.270263671875, -2.9256591796875, -2.5810546875, -2.2364501953125, -1.891845703125, -1.5472412109375, -1.20263671875, -0.8580322265625, -0.513427734375, -0.1688232421875, 0.17578125, 0.5203857421875, 0.864990234375, 1.2095947265625, 1.55419921875, 1.8988037109375, 2.243408203125, 2.5880126953125, 2.9326171875, 3.2772216796875, 3.621826171875, 3.9664306640625, 4.31103515625, 4.6556396484375, 5.000244140625, 5.3448486328125, 5.689453125, 6.0340576171875, 6.378662109375, 6.7232666015625, 7.06787109375, 7.4124755859375, 7.757080078125, 8.1016845703125, 8.4462890625, 8.7908935546875, 9.135498046875, 9.4801025390625, 9.82470703125, 10.1693115234375, 10.513916015625, 10.8585205078125, 11.203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 9.0, 13.0, 14.0, 14.0, 22.0, 25.0, 36.0, 31.0, 25.0, 44.0, 44.0, 45.0, 71.0, 72.0, 70.0, 54.0, 50.0, 56.0, 48.0, 29.0, 35.0, 39.0, 23.0, 26.0, 18.0, 12.0, 12.0, 6.0, 2.0, 5.0, 4.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.0289306640625, -3.885986328125, -3.7430419921875, -3.60009765625, -3.4571533203125, -3.314208984375, -3.1712646484375, -3.0283203125, -2.8853759765625, -2.742431640625, -2.5994873046875, -2.45654296875, -2.3135986328125, -2.170654296875, -2.0277099609375, -1.884765625, -1.7418212890625, -1.598876953125, -1.4559326171875, -1.31298828125, -1.1700439453125, -1.027099609375, -0.8841552734375, -0.7412109375, -0.5982666015625, -0.455322265625, -0.3123779296875, -0.16943359375, -0.0264892578125, 0.116455078125, 0.2593994140625, 0.40234375, 0.5452880859375, 0.688232421875, 0.8311767578125, 0.97412109375, 1.1170654296875, 1.260009765625, 1.4029541015625, 1.5458984375, 1.6888427734375, 1.831787109375, 1.9747314453125, 2.11767578125, 2.2606201171875, 2.403564453125, 2.5465087890625, 2.689453125, 2.8323974609375, 2.975341796875, 3.1182861328125, 3.26123046875, 3.4041748046875, 3.547119140625, 3.6900634765625, 3.8330078125, 3.9759521484375, 4.118896484375, 4.2618408203125, 4.40478515625, 4.5477294921875, 4.690673828125, 4.8336181640625, 4.9765625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 10.0, 9.0, 10.0, 12.0, 23.0, 14.0, 33.0, 25.0, 34.0, 52.0, 52.0, 51.0, 69.0, 80.0, 69.0, 71.0, 63.0, 56.0, 50.0, 37.0, 38.0, 32.0, 24.0, 20.0, 17.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.26683807373047, -42.10720443725586, -40.947574615478516, -39.787940979003906, -38.62831115722656, -37.46867752075195, -36.30904769897461, -35.1494140625, -33.989784240722656, -32.83015060424805, -31.670520782470703, -30.510889053344727, -29.35125732421875, -28.19162368774414, -27.031991958618164, -25.872360229492188, -24.712726593017578, -23.5530948638916, -22.393463134765625, -21.23383140563965, -20.074199676513672, -18.914566040039062, -17.754934310913086, -16.59530258178711, -15.435670852661133, -14.276039123535156, -13.11640739440918, -11.956774711608887, -10.79714298248291, -9.637511253356934, -8.47787857055664, -7.318246841430664, -6.158613204956055, -4.998981475830078, -3.8393492698669434, -2.6797173023223877, -1.520085334777832, -0.36045360565185547, 0.7991786003112793, 1.958810806274414, 3.1184425354003906, 4.278074264526367, 5.437706470489502, 6.597338676452637, 7.756970405578613, 8.91660213470459, 10.076234817504883, 11.23586654663086, 12.395498275756836, 13.555130004882812, 14.714761734008789, 15.874394416809082, 17.034027099609375, 18.19365692138672, 19.353290557861328, 20.512922286987305, 21.67255401611328, 22.832185745239258, 23.991817474365234, 25.15144920349121, 26.311080932617188, 27.470714569091797, 28.630346298217773, 29.78997802734375, 30.949609756469727]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 13.0, 7.0, 15.0, 15.0, 12.0, 13.0, 27.0, 22.0, 25.0, 26.0, 19.0, 32.0, 35.0, 33.0, 39.0, 49.0, 41.0, 45.0, 39.0, 50.0, 49.0, 36.0, 39.0, 28.0, 31.0, 32.0, 22.0, 32.0, 21.0, 23.0, 24.0, 15.0, 21.0, 14.0, 10.0, 5.0, 10.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-29.358545303344727, -28.471513748168945, -27.584484100341797, -26.697452545166016, -25.810420989990234, -24.923389434814453, -24.036357879638672, -23.149328231811523, -22.262296676635742, -21.37526512145996, -20.488235473632812, -19.60120391845703, -18.71417236328125, -17.82714080810547, -16.940109252929688, -16.05307960510254, -15.166048049926758, -14.279016494750977, -13.391985893249512, -12.504955291748047, -11.617923736572266, -10.730892181396484, -9.84386157989502, -8.956830978393555, -8.069799423217773, -7.18276834487915, -6.295737266540527, -5.408706188201904, -4.521675109863281, -3.634644031524658, -2.747612953186035, -1.860581874847412, -0.9735527038574219, -0.08652162551879883, 0.8005094528198242, 1.6875405311584473, 2.5745716094970703, 3.4616026878356934, 4.348633766174316, 5.2356648445129395, 6.1226959228515625, 7.0097270011901855, 7.896758079528809, 8.783788681030273, 9.670820236206055, 10.557851791381836, 11.4448823928833, 12.331912994384766, 13.218944549560547, 14.105976104736328, 14.993006706237793, 15.880037307739258, 16.76706886291504, 17.65410041809082, 18.54113006591797, 19.42816162109375, 20.31519317626953, 21.202224731445312, 22.089256286621094, 22.976285934448242, 23.863317489624023, 24.750349044799805, 25.637378692626953, 26.524410247802734, 27.411441802978516]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 17.0, 27.0, 44.0, 49.0, 80.0, 122.0, 136.0, 221.0, 345.0, 466.0, 804.0, 1178.0, 1860.0, 3111.0, 5185.0, 8839.0, 15820.0, 30271.0, 62163.0, 154929.0, 539737.0, 1535579.0, 1229159.0, 379015.0, 117786.0, 50151.0, 24996.0, 13398.0, 7456.0, 4337.0, 2628.0, 1590.0, 986.0, 628.0, 387.0, 255.0, 175.0, 120.0, 64.0, 57.0, 34.0, 26.0, 12.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0], "bins": [-49.65625, -48.30908203125, -46.9619140625, -45.61474609375, -44.267578125, -42.92041015625, -41.5732421875, -40.22607421875, -38.87890625, -37.53173828125, -36.1845703125, -34.83740234375, -33.490234375, -32.14306640625, -30.7958984375, -29.44873046875, -28.1015625, -26.75439453125, -25.4072265625, -24.06005859375, -22.712890625, -21.36572265625, -20.0185546875, -18.67138671875, -17.32421875, -15.97705078125, -14.6298828125, -13.28271484375, -11.935546875, -10.58837890625, -9.2412109375, -7.89404296875, -6.546875, -5.19970703125, -3.8525390625, -2.50537109375, -1.158203125, 0.18896484375, 1.5361328125, 2.88330078125, 4.23046875, 5.57763671875, 6.9248046875, 8.27197265625, 9.619140625, 10.96630859375, 12.3134765625, 13.66064453125, 15.0078125, 16.35498046875, 17.7021484375, 19.04931640625, 20.396484375, 21.74365234375, 23.0908203125, 24.43798828125, 25.78515625, 27.13232421875, 28.4794921875, 29.82666015625, 31.173828125, 32.52099609375, 33.8681640625, 35.21533203125, 36.5625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 6.0, 13.0, 15.0, 14.0, 13.0, 19.0, 21.0, 27.0, 29.0, 18.0, 29.0, 36.0, 40.0, 38.0, 37.0, 35.0, 49.0, 48.0, 49.0, 52.0, 43.0, 48.0, 36.0, 28.0, 31.0, 23.0, 21.0, 26.0, 26.0, 16.0, 17.0, 20.0, 18.0, 12.0, 11.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.84375, -25.05224609375, -24.2607421875, -23.46923828125, -22.677734375, -21.88623046875, -21.0947265625, -20.30322265625, -19.51171875, -18.72021484375, -17.9287109375, -17.13720703125, -16.345703125, -15.55419921875, -14.7626953125, -13.97119140625, -13.1796875, -12.38818359375, -11.5966796875, -10.80517578125, -10.013671875, -9.22216796875, -8.4306640625, -7.63916015625, -6.84765625, -6.05615234375, -5.2646484375, -4.47314453125, -3.681640625, -2.89013671875, -2.0986328125, -1.30712890625, -0.515625, 0.27587890625, 1.0673828125, 1.85888671875, 2.650390625, 3.44189453125, 4.2333984375, 5.02490234375, 5.81640625, 6.60791015625, 7.3994140625, 8.19091796875, 8.982421875, 9.77392578125, 10.5654296875, 11.35693359375, 12.1484375, 12.93994140625, 13.7314453125, 14.52294921875, 15.314453125, 16.10595703125, 16.8974609375, 17.68896484375, 18.48046875, 19.27197265625, 20.0634765625, 20.85498046875, 21.646484375, 22.43798828125, 23.2294921875, 24.02099609375, 24.8125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 9.0, 10.0, 12.0, 14.0, 21.0, 38.0, 55.0, 68.0, 102.0, 154.0, 227.0, 343.0, 557.0, 834.0, 1308.0, 1975.0, 3129.0, 5135.0, 8686.0, 14954.0, 26342.0, 49705.0, 98836.0, 216866.0, 547488.0, 1462841.0, 1051277.0, 377911.0, 159083.0, 75207.0, 38878.0, 21143.0, 12090.0, 7223.0, 4312.0, 2631.0, 1649.0, 1104.0, 711.0, 437.0, 352.0, 192.0, 128.0, 98.0, 43.0, 42.0, 21.0, 24.0, 10.0, 8.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.46875, -39.1552734375, -37.841796875, -36.5283203125, -35.21484375, -33.9013671875, -32.587890625, -31.2744140625, -29.9609375, -28.6474609375, -27.333984375, -26.0205078125, -24.70703125, -23.3935546875, -22.080078125, -20.7666015625, -19.453125, -18.1396484375, -16.826171875, -15.5126953125, -14.19921875, -12.8857421875, -11.572265625, -10.2587890625, -8.9453125, -7.6318359375, -6.318359375, -5.0048828125, -3.69140625, -2.3779296875, -1.064453125, 0.2490234375, 1.5625, 2.8759765625, 4.189453125, 5.5029296875, 6.81640625, 8.1298828125, 9.443359375, 10.7568359375, 12.0703125, 13.3837890625, 14.697265625, 16.0107421875, 17.32421875, 18.6376953125, 19.951171875, 21.2646484375, 22.578125, 23.8916015625, 25.205078125, 26.5185546875, 27.83203125, 29.1455078125, 30.458984375, 31.7724609375, 33.0859375, 34.3994140625, 35.712890625, 37.0263671875, 38.33984375, 39.6533203125, 40.966796875, 42.2802734375, 43.59375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 14.0, 11.0, 17.0, 17.0, 23.0, 43.0, 51.0, 58.0, 56.0, 94.0, 112.0, 165.0, 217.0, 251.0, 324.0, 411.0, 439.0, 369.0, 310.0, 258.0, 183.0, 139.0, 119.0, 91.0, 60.0, 56.0, 41.0, 26.0, 26.0, 12.0, 18.0, 4.0, 9.0, 6.0, 9.0, 7.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.671875, -13.2232666015625, -12.774658203125, -12.3260498046875, -11.87744140625, -11.4288330078125, -10.980224609375, -10.5316162109375, -10.0830078125, -9.6343994140625, -9.185791015625, -8.7371826171875, -8.28857421875, -7.8399658203125, -7.391357421875, -6.9427490234375, -6.494140625, -6.0455322265625, -5.596923828125, -5.1483154296875, -4.69970703125, -4.2510986328125, -3.802490234375, -3.3538818359375, -2.9052734375, -2.4566650390625, -2.008056640625, -1.5594482421875, -1.11083984375, -0.6622314453125, -0.213623046875, 0.2349853515625, 0.68359375, 1.1322021484375, 1.580810546875, 2.0294189453125, 2.47802734375, 2.9266357421875, 3.375244140625, 3.8238525390625, 4.2724609375, 4.7210693359375, 5.169677734375, 5.6182861328125, 6.06689453125, 6.5155029296875, 6.964111328125, 7.4127197265625, 7.861328125, 8.3099365234375, 8.758544921875, 9.2071533203125, 9.65576171875, 10.1043701171875, 10.552978515625, 11.0015869140625, 11.4501953125, 11.8988037109375, 12.347412109375, 12.7960205078125, 13.24462890625, 13.6932373046875, 14.141845703125, 14.5904541015625, 15.0390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 10.0, 20.0, 22.0, 15.0, 34.0, 47.0, 37.0, 35.0, 70.0, 61.0, 78.0, 71.0, 83.0, 68.0, 68.0, 56.0, 43.0, 35.0, 27.0, 20.0, 18.0, 17.0, 12.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.255611419677734, -37.085819244384766, -35.91602325439453, -34.74623107910156, -33.57643508911133, -32.40664291381836, -31.236846923828125, -30.067054748535156, -28.897258758544922, -27.72746467590332, -26.55767059326172, -25.387876510620117, -24.218082427978516, -23.048288345336914, -21.878494262695312, -20.708702087402344, -19.538908004760742, -18.36911392211914, -17.19931983947754, -16.029525756835938, -14.859731674194336, -13.689937591552734, -12.52014446258545, -11.350350379943848, -10.180556297302246, -9.010762214660645, -7.840968132019043, -6.6711745262146, -5.501380443572998, -4.3315863609313965, -3.161792755126953, -1.9919986724853516, -0.82220458984375, 0.347589373588562, 1.517383337020874, 2.6871771812438965, 3.856971263885498, 5.0267653465271, 6.196558952331543, 7.3663530349731445, 8.536147117614746, 9.705941200256348, 10.87573528289795, 12.045528411865234, 13.215322494506836, 14.385116577148438, 15.554910659790039, 16.72470474243164, 17.894498825073242, 19.064292907714844, 20.234086990356445, 21.403881072998047, 22.57367515563965, 23.74346923828125, 24.91326141357422, 26.083057403564453, 27.252849578857422, 28.422643661499023, 29.592437744140625, 30.762231826782227, 31.932025909423828, 33.1018180847168, 34.27161407470703, 35.44140625, 36.611202239990234]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 6.0, 9.0, 18.0, 14.0, 13.0, 23.0, 15.0, 18.0, 28.0, 28.0, 33.0, 25.0, 24.0, 40.0, 31.0, 42.0, 36.0, 35.0, 44.0, 39.0, 44.0, 35.0, 45.0, 43.0, 43.0, 40.0, 27.0, 15.0, 20.0, 36.0, 21.0, 13.0, 14.0, 11.0, 13.0, 11.0, 9.0, 4.0, 4.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.972131729125977, -27.14262580871582, -26.31311798095703, -25.483612060546875, -24.65410614013672, -23.82459831237793, -22.995092391967773, -22.165584564208984, -21.336078643798828, -20.506572723388672, -19.677064895629883, -18.847558975219727, -18.018051147460938, -17.18854522705078, -16.359039306640625, -15.529532432556152, -14.70002555847168, -13.870518684387207, -13.041011810302734, -12.211505889892578, -11.381999015808105, -10.552492141723633, -9.722986221313477, -8.893479347229004, -8.063972473144531, -7.234465599060059, -6.404959201812744, -5.57545280456543, -4.745945930480957, -3.9164390563964844, -3.08693265914917, -2.2574262619018555, -1.4279193878173828, -0.5984127521514893, 0.2310938835144043, 1.0606005191802979, 1.8901071548461914, 2.719614028930664, 3.5491204261779785, 4.378626823425293, 5.208133697509766, 6.037640571594238, 6.867146968841553, 7.696653366088867, 8.52616024017334, 9.355667114257812, 10.185173034667969, 11.014679908752441, 11.844186782836914, 12.673693656921387, 13.50320053100586, 14.332706451416016, 15.162213325500488, 15.991720199584961, 16.821226119995117, 17.650733947753906, 18.480239868164062, 19.30974578857422, 20.139253616333008, 20.968759536743164, 21.798267364501953, 22.62777328491211, 23.457279205322266, 24.286785125732422, 25.11629295349121]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 11.0, 13.0, 11.0, 40.0, 57.0, 71.0, 112.0, 148.0, 282.0, 403.0, 660.0, 978.0, 1592.0, 2518.0, 3827.0, 6479.0, 10157.0, 17138.0, 29844.0, 54302.0, 104605.0, 210993.0, 273010.0, 154197.0, 76789.0, 41323.0, 23243.0, 13595.0, 8291.0, 5007.0, 3311.0, 2010.0, 1297.0, 789.0, 504.0, 323.0, 213.0, 137.0, 87.0, 62.0, 42.0, 24.0, 23.0, 15.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.4443359375, -22.669921875, -21.8955078125, -21.12109375, -20.3466796875, -19.572265625, -18.7978515625, -18.0234375, -17.2490234375, -16.474609375, -15.7001953125, -14.92578125, -14.1513671875, -13.376953125, -12.6025390625, -11.828125, -11.0537109375, -10.279296875, -9.5048828125, -8.73046875, -7.9560546875, -7.181640625, -6.4072265625, -5.6328125, -4.8583984375, -4.083984375, -3.3095703125, -2.53515625, -1.7607421875, -0.986328125, -0.2119140625, 0.5625, 1.3369140625, 2.111328125, 2.8857421875, 3.66015625, 4.4345703125, 5.208984375, 5.9833984375, 6.7578125, 7.5322265625, 8.306640625, 9.0810546875, 9.85546875, 10.6298828125, 11.404296875, 12.1787109375, 12.953125, 13.7275390625, 14.501953125, 15.2763671875, 16.05078125, 16.8251953125, 17.599609375, 18.3740234375, 19.1484375, 19.9228515625, 20.697265625, 21.4716796875, 22.24609375, 23.0205078125, 23.794921875, 24.5693359375, 25.34375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 7.0, 11.0, 15.0, 11.0, 22.0, 20.0, 16.0, 22.0, 26.0, 21.0, 24.0, 30.0, 41.0, 30.0, 35.0, 51.0, 36.0, 54.0, 46.0, 52.0, 42.0, 34.0, 55.0, 45.0, 33.0, 33.0, 19.0, 19.0, 29.0, 26.0, 17.0, 16.0, 9.0, 10.0, 12.0, 6.0, 2.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.03125, -29.1220703125, -28.212890625, -27.3037109375, -26.39453125, -25.4853515625, -24.576171875, -23.6669921875, -22.7578125, -21.8486328125, -20.939453125, -20.0302734375, -19.12109375, -18.2119140625, -17.302734375, -16.3935546875, -15.484375, -14.5751953125, -13.666015625, -12.7568359375, -11.84765625, -10.9384765625, -10.029296875, -9.1201171875, -8.2109375, -7.3017578125, -6.392578125, -5.4833984375, -4.57421875, -3.6650390625, -2.755859375, -1.8466796875, -0.9375, -0.0283203125, 0.880859375, 1.7900390625, 2.69921875, 3.6083984375, 4.517578125, 5.4267578125, 6.3359375, 7.2451171875, 8.154296875, 9.0634765625, 9.97265625, 10.8818359375, 11.791015625, 12.7001953125, 13.609375, 14.5185546875, 15.427734375, 16.3369140625, 17.24609375, 18.1552734375, 19.064453125, 19.9736328125, 20.8828125, 21.7919921875, 22.701171875, 23.6103515625, 24.51953125, 25.4287109375, 26.337890625, 27.2470703125, 28.15625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 13.0, 8.0, 13.0, 20.0, 31.0, 28.0, 53.0, 81.0, 90.0, 152.0, 198.0, 325.0, 455.0, 632.0, 959.0, 1420.0, 2204.0, 3270.0, 5262.0, 8152.0, 13313.0, 22071.0, 39399.0, 74392.0, 155012.0, 302880.0, 205408.0, 94305.0, 48727.0, 26908.0, 15764.0, 9438.0, 5960.0, 3918.0, 2451.0, 1656.0, 1114.0, 810.0, 521.0, 376.0, 211.0, 150.0, 135.0, 88.0, 62.0, 34.0, 24.0, 24.0, 9.0, 10.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0], "bins": [-28.65625, -27.75146484375, -26.8466796875, -25.94189453125, -25.037109375, -24.13232421875, -23.2275390625, -22.32275390625, -21.41796875, -20.51318359375, -19.6083984375, -18.70361328125, -17.798828125, -16.89404296875, -15.9892578125, -15.08447265625, -14.1796875, -13.27490234375, -12.3701171875, -11.46533203125, -10.560546875, -9.65576171875, -8.7509765625, -7.84619140625, -6.94140625, -6.03662109375, -5.1318359375, -4.22705078125, -3.322265625, -2.41748046875, -1.5126953125, -0.60791015625, 0.296875, 1.20166015625, 2.1064453125, 3.01123046875, 3.916015625, 4.82080078125, 5.7255859375, 6.63037109375, 7.53515625, 8.43994140625, 9.3447265625, 10.24951171875, 11.154296875, 12.05908203125, 12.9638671875, 13.86865234375, 14.7734375, 15.67822265625, 16.5830078125, 17.48779296875, 18.392578125, 19.29736328125, 20.2021484375, 21.10693359375, 22.01171875, 22.91650390625, 23.8212890625, 24.72607421875, 25.630859375, 26.53564453125, 27.4404296875, 28.34521484375, 29.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 10.0, 4.0, 12.0, 9.0, 16.0, 18.0, 15.0, 13.0, 23.0, 25.0, 19.0, 26.0, 33.0, 28.0, 26.0, 38.0, 31.0, 30.0, 41.0, 34.0, 44.0, 41.0, 42.0, 39.0, 34.0, 31.0, 35.0, 32.0, 33.0, 34.0, 24.0, 27.0, 19.0, 19.0, 19.0, 10.0, 11.0, 5.0, 14.0, 6.0, 3.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.65625, -14.1484375, -13.640625, -13.1328125, -12.625, -12.1171875, -11.609375, -11.1015625, -10.59375, -10.0859375, -9.578125, -9.0703125, -8.5625, -8.0546875, -7.546875, -7.0390625, -6.53125, -6.0234375, -5.515625, -5.0078125, -4.5, -3.9921875, -3.484375, -2.9765625, -2.46875, -1.9609375, -1.453125, -0.9453125, -0.4375, 0.0703125, 0.578125, 1.0859375, 1.59375, 2.1015625, 2.609375, 3.1171875, 3.625, 4.1328125, 4.640625, 5.1484375, 5.65625, 6.1640625, 6.671875, 7.1796875, 7.6875, 8.1953125, 8.703125, 9.2109375, 9.71875, 10.2265625, 10.734375, 11.2421875, 11.75, 12.2578125, 12.765625, 13.2734375, 13.78125, 14.2890625, 14.796875, 15.3046875, 15.8125, 16.3203125, 16.828125, 17.3359375, 17.84375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 8.0, 11.0, 24.0, 20.0, 41.0, 68.0, 82.0, 117.0, 197.0, 335.0, 528.0, 909.0, 1559.0, 3005.0, 5702.0, 11659.0, 25370.0, 62858.0, 182163.0, 431196.0, 201097.0, 68036.0, 27710.0, 12551.0, 5988.0, 3102.0, 1697.0, 1001.0, 534.0, 340.0, 224.0, 138.0, 76.0, 56.0, 42.0, 27.0, 33.0, 15.0, 13.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.70703125, -11.296875, -10.88671875, -10.4765625, -10.06640625, -9.65625, -9.24609375, -8.8359375, -8.42578125, -8.015625, -7.60546875, -7.1953125, -6.78515625, -6.375, -5.96484375, -5.5546875, -5.14453125, -4.734375, -4.32421875, -3.9140625, -3.50390625, -3.09375, -2.68359375, -2.2734375, -1.86328125, -1.453125, -1.04296875, -0.6328125, -0.22265625, 0.1875, 0.59765625, 1.0078125, 1.41796875, 1.828125, 2.23828125, 2.6484375, 3.05859375, 3.46875, 3.87890625, 4.2890625, 4.69921875, 5.109375, 5.51953125, 5.9296875, 6.33984375, 6.75, 7.16015625, 7.5703125, 7.98046875, 8.390625, 8.80078125, 9.2109375, 9.62109375, 10.03125, 10.44140625, 10.8515625, 11.26171875, 11.671875, 12.08203125, 12.4921875, 12.90234375, 13.3125, 13.72265625, 14.1328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 2.0, 9.0, 9.0, 10.0, 18.0, 23.0, 41.0, 36.0, 37.0, 66.0, 86.0, 108.0, 89.0, 115.0, 93.0, 50.0, 50.0, 44.0, 35.0, 18.0, 14.0, 20.0, 8.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013818740844726562, -0.0013416856527328491, -0.001301497220993042, -0.0012613087892532349, -0.0012211203575134277, -0.0011809319257736206, -0.0011407434940338135, -0.0011005550622940063, -0.0010603666305541992, -0.001020178198814392, -0.000979989767074585, -0.0009398013353347778, -0.0008996129035949707, -0.0008594244718551636, -0.0008192360401153564, -0.0007790476083755493, -0.0007388591766357422, -0.0006986707448959351, -0.0006584823131561279, -0.0006182938814163208, -0.0005781054496765137, -0.0005379170179367065, -0.0004977285861968994, -0.0004575401544570923, -0.00041735172271728516, -0.00037716329097747803, -0.0003369748592376709, -0.00029678642749786377, -0.00025659799575805664, -0.0002164095640182495, -0.00017622113227844238, -0.00013603270053863525, -9.584426879882812e-05, -5.5655837059020996e-05, -1.5467405319213867e-05, 2.4721026420593262e-05, 6.490945816040039e-05, 0.00010509788990020752, 0.00014528632164001465, 0.00018547475337982178, 0.0002256631851196289, 0.00026585161685943604, 0.00030604004859924316, 0.0003462284803390503, 0.0003864169120788574, 0.00042660534381866455, 0.0004667937755584717, 0.0005069822072982788, 0.0005471706390380859, 0.0005873590707778931, 0.0006275475025177002, 0.0006677359342575073, 0.0007079243659973145, 0.0007481127977371216, 0.0007883012294769287, 0.0008284896612167358, 0.000868678092956543, 0.0009088665246963501, 0.0009490549564361572, 0.0009892433881759644, 0.0010294318199157715, 0.0010696202516555786, 0.0011098086833953857, 0.0011499971151351929, 0.001190185546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 14.0, 14.0, 16.0, 26.0, 37.0, 40.0, 74.0, 90.0, 161.0, 207.0, 311.0, 472.0, 739.0, 1183.0, 1844.0, 3029.0, 5032.0, 8606.0, 14913.0, 26812.0, 50837.0, 101220.0, 211750.0, 290174.0, 161745.0, 77637.0, 39747.0, 21536.0, 12099.0, 7020.0, 4257.0, 2455.0, 1576.0, 969.0, 662.0, 412.0, 260.0, 186.0, 110.0, 80.0, 62.0, 40.0, 25.0, 17.0, 15.0, 12.0, 9.0, 5.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.5703125, -10.209716796875, -9.84912109375, -9.488525390625, -9.1279296875, -8.767333984375, -8.40673828125, -8.046142578125, -7.685546875, -7.324951171875, -6.96435546875, -6.603759765625, -6.2431640625, -5.882568359375, -5.52197265625, -5.161376953125, -4.80078125, -4.440185546875, -4.07958984375, -3.718994140625, -3.3583984375, -2.997802734375, -2.63720703125, -2.276611328125, -1.916015625, -1.555419921875, -1.19482421875, -0.834228515625, -0.4736328125, -0.113037109375, 0.24755859375, 0.608154296875, 0.96875, 1.329345703125, 1.68994140625, 2.050537109375, 2.4111328125, 2.771728515625, 3.13232421875, 3.492919921875, 3.853515625, 4.214111328125, 4.57470703125, 4.935302734375, 5.2958984375, 5.656494140625, 6.01708984375, 6.377685546875, 6.73828125, 7.098876953125, 7.45947265625, 7.820068359375, 8.1806640625, 8.541259765625, 8.90185546875, 9.262451171875, 9.623046875, 9.983642578125, 10.34423828125, 10.704833984375, 11.0654296875, 11.426025390625, 11.78662109375, 12.147216796875, 12.5078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 4.0, 8.0, 1.0, 7.0, 7.0, 9.0, 10.0, 15.0, 21.0, 29.0, 29.0, 27.0, 38.0, 46.0, 50.0, 67.0, 61.0, 79.0, 60.0, 64.0, 55.0, 61.0, 52.0, 44.0, 37.0, 27.0, 16.0, 17.0, 21.0, 12.0, 10.0, 7.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.131256103515625, -3.01446533203125, -2.897674560546875, -2.7808837890625, -2.664093017578125, -2.54730224609375, -2.430511474609375, -2.313720703125, -2.196929931640625, -2.08013916015625, -1.963348388671875, -1.8465576171875, -1.729766845703125, -1.61297607421875, -1.496185302734375, -1.37939453125, -1.262603759765625, -1.14581298828125, -1.029022216796875, -0.9122314453125, -0.795440673828125, -0.67864990234375, -0.561859130859375, -0.445068359375, -0.328277587890625, -0.21148681640625, -0.094696044921875, 0.0220947265625, 0.138885498046875, 0.25567626953125, 0.372467041015625, 0.4892578125, 0.606048583984375, 0.72283935546875, 0.839630126953125, 0.9564208984375, 1.073211669921875, 1.19000244140625, 1.306793212890625, 1.423583984375, 1.540374755859375, 1.65716552734375, 1.773956298828125, 1.8907470703125, 2.007537841796875, 2.12432861328125, 2.241119384765625, 2.35791015625, 2.474700927734375, 2.59149169921875, 2.708282470703125, 2.8250732421875, 2.941864013671875, 3.05865478515625, 3.175445556640625, 3.292236328125, 3.409027099609375, 3.52581787109375, 3.642608642578125, 3.7593994140625, 3.876190185546875, 3.99298095703125, 4.109771728515625, 4.2265625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 12.0, 13.0, 14.0, 19.0, 22.0, 24.0, 32.0, 39.0, 55.0, 54.0, 59.0, 75.0, 83.0, 86.0, 63.0, 61.0, 52.0, 43.0, 40.0, 30.0, 22.0, 19.0, 14.0, 24.0, 16.0, 10.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.25048828125, -36.11517333984375, -34.9798583984375, -33.84454345703125, -32.709228515625, -31.573911666870117, -30.438594818115234, -29.303279876708984, -28.167964935302734, -27.032649993896484, -25.897335052490234, -24.76201820373535, -23.6267032623291, -22.49138832092285, -21.35607147216797, -20.22075653076172, -19.08544158935547, -17.95012664794922, -16.81481170654297, -15.679494857788086, -14.544179916381836, -13.408864974975586, -12.27354907989502, -11.138233184814453, -10.002918243408203, -8.867603302001953, -7.732287406921387, -6.5969719886779785, -5.46165657043457, -4.326341152191162, -3.191025733947754, -2.0557103157043457, -0.9203987121582031, 0.21491670608520508, 1.3502321243286133, 2.4855475425720215, 3.6208629608154297, 4.756178379058838, 5.891493797302246, 7.026809215545654, 8.162124633789062, 9.297439575195312, 10.432755470275879, 11.568071365356445, 12.703386306762695, 13.838701248168945, 14.974017143249512, 16.109333038330078, 17.244647979736328, 18.379962921142578, 19.515277862548828, 20.65059471130371, 21.78590965270996, 22.92122459411621, 24.056541442871094, 25.191856384277344, 26.327171325683594, 27.462486267089844, 28.597801208496094, 29.733118057250977, 30.868432998657227, 32.00374984741211, 33.13906478881836, 34.27437973022461, 35.40969467163086]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 4.0, 11.0, 11.0, 14.0, 10.0, 14.0, 22.0, 15.0, 15.0, 30.0, 25.0, 21.0, 26.0, 29.0, 34.0, 31.0, 41.0, 42.0, 31.0, 40.0, 43.0, 39.0, 35.0, 40.0, 36.0, 46.0, 45.0, 32.0, 25.0, 19.0, 26.0, 30.0, 17.0, 11.0, 13.0, 15.0, 14.0, 8.0, 6.0, 6.0, 8.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.385093688964844, -25.59136962890625, -24.79764747619629, -24.003923416137695, -23.210201263427734, -22.41647720336914, -21.622753143310547, -20.829030990600586, -20.035308837890625, -19.24158477783203, -18.44786262512207, -17.654138565063477, -16.860416412353516, -16.066692352294922, -15.272969245910645, -14.479246139526367, -13.685522079467773, -12.891798973083496, -12.098075866699219, -11.304351806640625, -10.510629653930664, -9.71690559387207, -8.923182487487793, -8.129459381103516, -7.335736274719238, -6.542013168334961, -5.748290061950684, -4.954566478729248, -4.160843372344971, -3.3671202659606934, -2.573396682739258, -1.7796735763549805, -0.9859504699707031, -0.19222724437713623, 0.6014959812164307, 1.395219326019287, 2.1889424324035645, 2.982665538787842, 3.7763891220092773, 4.570112228393555, 5.363835334777832, 6.157558441162109, 6.951281547546387, 7.745005130767822, 8.538728713989258, 9.332450866699219, 10.126174926757812, 10.91989803314209, 11.713621139526367, 12.507344245910645, 13.301067352294922, 14.094791412353516, 14.888513565063477, 15.68223762512207, 16.47595977783203, 17.269683837890625, 18.06340789794922, 18.857131958007812, 19.650854110717773, 20.444578170776367, 21.238300323486328, 22.032024383544922, 22.825748443603516, 23.619470596313477, 24.413192749023438]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 11.0, 21.0, 15.0, 18.0, 36.0, 66.0, 80.0, 108.0, 156.0, 196.0, 297.0, 463.0, 707.0, 973.0, 1564.0, 2392.0, 3562.0, 5637.0, 9027.0, 14300.0, 23560.0, 39083.0, 66204.0, 111337.0, 173931.0, 204217.0, 153534.0, 94311.0, 55750.0, 32982.0, 19821.0, 12400.0, 7579.0, 4932.0, 3126.0, 2074.0, 1324.0, 880.0, 572.0, 383.0, 306.0, 185.0, 138.0, 83.0, 72.0, 47.0, 29.0, 23.0, 17.0, 17.0, 3.0, 4.0, 2.0, 0.0, 6.0, 4.0, 1.0], "bins": [-34.59375, -33.52392578125, -32.4541015625, -31.38427734375, -30.314453125, -29.24462890625, -28.1748046875, -27.10498046875, -26.03515625, -24.96533203125, -23.8955078125, -22.82568359375, -21.755859375, -20.68603515625, -19.6162109375, -18.54638671875, -17.4765625, -16.40673828125, -15.3369140625, -14.26708984375, -13.197265625, -12.12744140625, -11.0576171875, -9.98779296875, -8.91796875, -7.84814453125, -6.7783203125, -5.70849609375, -4.638671875, -3.56884765625, -2.4990234375, -1.42919921875, -0.359375, 0.71044921875, 1.7802734375, 2.85009765625, 3.919921875, 4.98974609375, 6.0595703125, 7.12939453125, 8.19921875, 9.26904296875, 10.3388671875, 11.40869140625, 12.478515625, 13.54833984375, 14.6181640625, 15.68798828125, 16.7578125, 17.82763671875, 18.8974609375, 19.96728515625, 21.037109375, 22.10693359375, 23.1767578125, 24.24658203125, 25.31640625, 26.38623046875, 27.4560546875, 28.52587890625, 29.595703125, 30.66552734375, 31.7353515625, 32.80517578125, 33.875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 9.0, 7.0, 15.0, 12.0, 10.0, 21.0, 14.0, 18.0, 24.0, 22.0, 26.0, 24.0, 30.0, 30.0, 42.0, 47.0, 35.0, 43.0, 31.0, 38.0, 38.0, 51.0, 41.0, 46.0, 32.0, 44.0, 32.0, 20.0, 25.0, 19.0, 26.0, 29.0, 19.0, 11.0, 13.0, 10.0, 10.0, 4.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.046875, -26.2158203125, -25.384765625, -24.5537109375, -23.72265625, -22.8916015625, -22.060546875, -21.2294921875, -20.3984375, -19.5673828125, -18.736328125, -17.9052734375, -17.07421875, -16.2431640625, -15.412109375, -14.5810546875, -13.75, -12.9189453125, -12.087890625, -11.2568359375, -10.42578125, -9.5947265625, -8.763671875, -7.9326171875, -7.1015625, -6.2705078125, -5.439453125, -4.6083984375, -3.77734375, -2.9462890625, -2.115234375, -1.2841796875, -0.453125, 0.3779296875, 1.208984375, 2.0400390625, 2.87109375, 3.7021484375, 4.533203125, 5.3642578125, 6.1953125, 7.0263671875, 7.857421875, 8.6884765625, 9.51953125, 10.3505859375, 11.181640625, 12.0126953125, 12.84375, 13.6748046875, 14.505859375, 15.3369140625, 16.16796875, 16.9990234375, 17.830078125, 18.6611328125, 19.4921875, 20.3232421875, 21.154296875, 21.9853515625, 22.81640625, 23.6474609375, 24.478515625, 25.3095703125, 26.140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 10.0, 15.0, 21.0, 42.0, 58.0, 81.0, 104.0, 160.0, 235.0, 336.0, 545.0, 717.0, 1109.0, 1699.0, 2526.0, 3658.0, 5751.0, 8589.0, 13531.0, 21243.0, 33847.0, 54834.0, 89713.0, 140775.0, 185413.0, 171065.0, 117404.0, 72494.0, 44769.0, 27648.0, 17343.0, 11180.0, 7223.0, 4815.0, 3152.0, 2132.0, 1366.0, 905.0, 618.0, 479.0, 311.0, 213.0, 121.0, 90.0, 57.0, 45.0, 34.0, 27.0, 15.0, 13.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-32.59375, -31.568359375, -30.54296875, -29.517578125, -28.4921875, -27.466796875, -26.44140625, -25.416015625, -24.390625, -23.365234375, -22.33984375, -21.314453125, -20.2890625, -19.263671875, -18.23828125, -17.212890625, -16.1875, -15.162109375, -14.13671875, -13.111328125, -12.0859375, -11.060546875, -10.03515625, -9.009765625, -7.984375, -6.958984375, -5.93359375, -4.908203125, -3.8828125, -2.857421875, -1.83203125, -0.806640625, 0.21875, 1.244140625, 2.26953125, 3.294921875, 4.3203125, 5.345703125, 6.37109375, 7.396484375, 8.421875, 9.447265625, 10.47265625, 11.498046875, 12.5234375, 13.548828125, 14.57421875, 15.599609375, 16.625, 17.650390625, 18.67578125, 19.701171875, 20.7265625, 21.751953125, 22.77734375, 23.802734375, 24.828125, 25.853515625, 26.87890625, 27.904296875, 28.9296875, 29.955078125, 30.98046875, 32.005859375, 33.03125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 11.0, 6.0, 21.0, 14.0, 23.0, 25.0, 25.0, 30.0, 30.0, 25.0, 31.0, 39.0, 36.0, 35.0, 36.0, 42.0, 44.0, 39.0, 43.0, 38.0, 34.0, 35.0, 37.0, 32.0, 26.0, 28.0, 27.0, 24.0, 13.0, 14.0, 12.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 12.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.515625, -16.00146484375, -15.4873046875, -14.97314453125, -14.458984375, -13.94482421875, -13.4306640625, -12.91650390625, -12.40234375, -11.88818359375, -11.3740234375, -10.85986328125, -10.345703125, -9.83154296875, -9.3173828125, -8.80322265625, -8.2890625, -7.77490234375, -7.2607421875, -6.74658203125, -6.232421875, -5.71826171875, -5.2041015625, -4.68994140625, -4.17578125, -3.66162109375, -3.1474609375, -2.63330078125, -2.119140625, -1.60498046875, -1.0908203125, -0.57666015625, -0.0625, 0.45166015625, 0.9658203125, 1.47998046875, 1.994140625, 2.50830078125, 3.0224609375, 3.53662109375, 4.05078125, 4.56494140625, 5.0791015625, 5.59326171875, 6.107421875, 6.62158203125, 7.1357421875, 7.64990234375, 8.1640625, 8.67822265625, 9.1923828125, 9.70654296875, 10.220703125, 10.73486328125, 11.2490234375, 11.76318359375, 12.27734375, 12.79150390625, 13.3056640625, 13.81982421875, 14.333984375, 14.84814453125, 15.3623046875, 15.87646484375, 16.390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 12.0, 17.0, 26.0, 33.0, 65.0, 92.0, 140.0, 216.0, 314.0, 512.0, 898.0, 1341.0, 2109.0, 3410.0, 5805.0, 10145.0, 18105.0, 34563.0, 71358.0, 154123.0, 275540.0, 236089.0, 117056.0, 54267.0, 27059.0, 14440.0, 8170.0, 4831.0, 2901.0, 1765.0, 1139.0, 721.0, 462.0, 280.0, 197.0, 113.0, 78.0, 50.0, 43.0, 22.0, 7.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.9609375, -12.5535888671875, -12.146240234375, -11.7388916015625, -11.33154296875, -10.9241943359375, -10.516845703125, -10.1094970703125, -9.7021484375, -9.2947998046875, -8.887451171875, -8.4801025390625, -8.07275390625, -7.6654052734375, -7.258056640625, -6.8507080078125, -6.443359375, -6.0360107421875, -5.628662109375, -5.2213134765625, -4.81396484375, -4.4066162109375, -3.999267578125, -3.5919189453125, -3.1845703125, -2.7772216796875, -2.369873046875, -1.9625244140625, -1.55517578125, -1.1478271484375, -0.740478515625, -0.3331298828125, 0.07421875, 0.4815673828125, 0.888916015625, 1.2962646484375, 1.70361328125, 2.1109619140625, 2.518310546875, 2.9256591796875, 3.3330078125, 3.7403564453125, 4.147705078125, 4.5550537109375, 4.96240234375, 5.3697509765625, 5.777099609375, 6.1844482421875, 6.591796875, 6.9991455078125, 7.406494140625, 7.8138427734375, 8.22119140625, 8.6285400390625, 9.035888671875, 9.4432373046875, 9.8505859375, 10.2579345703125, 10.665283203125, 11.0726318359375, 11.47998046875, 11.8873291015625, 12.294677734375, 12.7020263671875, 13.109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 8.0, 17.0, 13.0, 18.0, 43.0, 42.0, 65.0, 90.0, 112.0, 137.0, 124.0, 96.0, 63.0, 49.0, 33.0, 21.0, 15.0, 15.0, 8.0, 8.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00164794921875, -0.0015880763530731201, -0.0015282034873962402, -0.0014683306217193604, -0.0014084577560424805, -0.0013485848903656006, -0.0012887120246887207, -0.0012288391590118408, -0.001168966293334961, -0.001109093427658081, -0.0010492205619812012, -0.0009893476963043213, -0.0009294748306274414, -0.0008696019649505615, -0.0008097290992736816, -0.0007498562335968018, -0.0006899833679199219, -0.000630110502243042, -0.0005702376365661621, -0.0005103647708892822, -0.00045049190521240234, -0.00039061903953552246, -0.0003307461738586426, -0.0002708733081817627, -0.0002110004425048828, -0.00015112757682800293, -9.125471115112305e-05, -3.1381845474243164e-05, 2.849102020263672e-05, 8.83638858795166e-05, 0.00014823675155639648, 0.00020810961723327637, 0.00026798248291015625, 0.00032785534858703613, 0.000387728214263916, 0.0004476010799407959, 0.0005074739456176758, 0.0005673468112945557, 0.0006272196769714355, 0.0006870925426483154, 0.0007469654083251953, 0.0008068382740020752, 0.0008667111396789551, 0.000926584005355835, 0.0009864568710327148, 0.0010463297367095947, 0.0011062026023864746, 0.0011660754680633545, 0.0012259483337402344, 0.0012858211994171143, 0.0013456940650939941, 0.001405566930770874, 0.001465439796447754, 0.0015253126621246338, 0.0015851855278015137, 0.0016450583934783936, 0.0017049312591552734, 0.0017648041248321533, 0.0018246769905090332, 0.001884549856185913, 0.001944422721862793, 0.002004295587539673, 0.0020641684532165527, 0.0021240413188934326, 0.0021839141845703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 0.0, 6.0, 5.0, 5.0, 16.0, 26.0, 45.0, 70.0, 112.0, 150.0, 263.0, 365.0, 639.0, 870.0, 1484.0, 2409.0, 3989.0, 6755.0, 12309.0, 23693.0, 48522.0, 105058.0, 219719.0, 289671.0, 172236.0, 79897.0, 37345.0, 18603.0, 10065.0, 5497.0, 3287.0, 2049.0, 1265.0, 732.0, 536.0, 290.0, 204.0, 126.0, 89.0, 61.0, 41.0, 18.0, 15.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6737060546875, -11.230224609375, -10.7867431640625, -10.34326171875, -9.8997802734375, -9.456298828125, -9.0128173828125, -8.5693359375, -8.1258544921875, -7.682373046875, -7.2388916015625, -6.79541015625, -6.3519287109375, -5.908447265625, -5.4649658203125, -5.021484375, -4.5780029296875, -4.134521484375, -3.6910400390625, -3.24755859375, -2.8040771484375, -2.360595703125, -1.9171142578125, -1.4736328125, -1.0301513671875, -0.586669921875, -0.1431884765625, 0.30029296875, 0.7437744140625, 1.187255859375, 1.6307373046875, 2.07421875, 2.5177001953125, 2.961181640625, 3.4046630859375, 3.84814453125, 4.2916259765625, 4.735107421875, 5.1785888671875, 5.6220703125, 6.0655517578125, 6.509033203125, 6.9525146484375, 7.39599609375, 7.8394775390625, 8.282958984375, 8.7264404296875, 9.169921875, 9.6134033203125, 10.056884765625, 10.5003662109375, 10.94384765625, 11.3873291015625, 11.830810546875, 12.2742919921875, 12.7177734375, 13.1612548828125, 13.604736328125, 14.0482177734375, 14.49169921875, 14.9351806640625, 15.378662109375, 15.8221435546875, 16.265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 1.0, 4.0, 11.0, 6.0, 7.0, 6.0, 13.0, 20.0, 16.0, 20.0, 35.0, 27.0, 32.0, 42.0, 37.0, 59.0, 73.0, 57.0, 61.0, 70.0, 66.0, 55.0, 54.0, 42.0, 30.0, 27.0, 25.0, 17.0, 23.0, 14.0, 9.0, 9.0, 8.0, 4.0, 5.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05078125, -2.93927001953125, -2.8277587890625, -2.71624755859375, -2.604736328125, -2.49322509765625, -2.3817138671875, -2.27020263671875, -2.15869140625, -2.04718017578125, -1.9356689453125, -1.82415771484375, -1.712646484375, -1.60113525390625, -1.4896240234375, -1.37811279296875, -1.2666015625, -1.15509033203125, -1.0435791015625, -0.93206787109375, -0.820556640625, -0.70904541015625, -0.5975341796875, -0.48602294921875, -0.37451171875, -0.26300048828125, -0.1514892578125, -0.03997802734375, 0.071533203125, 0.18304443359375, 0.2945556640625, 0.40606689453125, 0.517578125, 0.62908935546875, 0.7406005859375, 0.85211181640625, 0.963623046875, 1.07513427734375, 1.1866455078125, 1.29815673828125, 1.40966796875, 1.52117919921875, 1.6326904296875, 1.74420166015625, 1.855712890625, 1.96722412109375, 2.0787353515625, 2.19024658203125, 2.3017578125, 2.41326904296875, 2.5247802734375, 2.63629150390625, 2.747802734375, 2.85931396484375, 2.9708251953125, 3.08233642578125, 3.19384765625, 3.30535888671875, 3.4168701171875, 3.52838134765625, 3.639892578125, 3.75140380859375, 3.8629150390625, 3.97442626953125, 4.0859375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 15.0, 16.0, 24.0, 30.0, 36.0, 39.0, 61.0, 60.0, 75.0, 59.0, 88.0, 73.0, 60.0, 71.0, 49.0, 38.0, 42.0, 28.0, 23.0, 26.0, 17.0, 12.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.118370056152344, -42.949161529541016, -41.77995300292969, -40.610748291015625, -39.4415397644043, -38.27233123779297, -37.10312271118164, -35.93391418457031, -34.76470947265625, -33.59550094604492, -32.426292419433594, -31.2570858001709, -30.087879180908203, -28.918670654296875, -27.749462127685547, -26.58025550842285, -25.411046981811523, -24.241838455200195, -23.0726318359375, -21.903423309326172, -20.734216690063477, -19.56500816345215, -18.395801544189453, -17.226593017578125, -16.057384490966797, -14.888176918029785, -13.718969345092773, -12.549760818481445, -11.38055419921875, -10.211345672607422, -9.04213809967041, -7.872930526733398, -6.70372200012207, -5.534514427185059, -4.365306854248047, -3.196098804473877, -2.0268912315368652, -0.8576836585998535, 0.3115243911743164, 1.4807319641113281, 2.64993953704834, 3.8191471099853516, 4.988354682922363, 6.157562732696533, 7.326770305633545, 8.495977401733398, 9.665185928344727, 10.834393501281738, 12.00360107421875, 13.172808647155762, 14.342016220092773, 15.511224746704102, 16.680431365966797, 17.849639892578125, 19.018848419189453, 20.18805503845215, 21.357261657714844, 22.526470184326172, 23.695676803588867, 24.864885330200195, 26.03409194946289, 27.20330047607422, 28.372509002685547, 29.541715621948242, 30.71092414855957]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 10.0, 10.0, 4.0, 12.0, 15.0, 15.0, 15.0, 15.0, 10.0, 23.0, 24.0, 27.0, 32.0, 32.0, 37.0, 28.0, 38.0, 38.0, 30.0, 21.0, 38.0, 37.0, 43.0, 40.0, 39.0, 41.0, 29.0, 29.0, 31.0, 29.0, 29.0, 24.0, 19.0, 21.0, 12.0, 15.0, 9.0, 10.0, 18.0, 4.0, 5.0, 3.0, 11.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.878774642944336, -24.09693145751953, -23.315088272094727, -22.533245086669922, -21.751399993896484, -20.96955680847168, -20.187713623046875, -19.40587043762207, -18.624027252197266, -17.84218406677246, -17.060340881347656, -16.27849578857422, -15.496652603149414, -14.71480941772461, -13.932966232299805, -13.151123046875, -12.369277954101562, -11.587434768676758, -10.805590629577637, -10.023747444152832, -9.241903305053711, -8.460060119628906, -7.678216934204102, -6.896373271942139, -6.114529609680176, -5.332685947418213, -4.55084228515625, -3.7689990997314453, -2.9871554374694824, -2.2053117752075195, -1.4234685897827148, -0.641624927520752, 0.14022064208984375, 0.9220641851425171, 1.7039077281951904, 2.485751152038574, 3.267594814300537, 4.0494384765625, 4.831281661987305, 5.613125324249268, 6.3949689865112305, 7.176812648773193, 7.958656311035156, 8.740499496459961, 9.522342681884766, 10.304186820983887, 11.086030006408691, 11.867874145507812, 12.649717330932617, 13.431560516357422, 14.213404655456543, 14.995247840881348, 15.777091979980469, 16.558935165405273, 17.340778350830078, 18.122621536254883, 18.904464721679688, 19.686307907104492, 20.468151092529297, 21.249996185302734, 22.03183937072754, 22.813682556152344, 23.59552574157715, 24.377368927001953, 25.15921401977539]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 15.0, 18.0, 23.0, 35.0, 39.0, 69.0, 101.0, 116.0, 158.0, 247.0, 353.0, 500.0, 694.0, 1040.0, 1593.0, 2468.0, 3790.0, 6468.0, 10965.0, 19271.0, 35639.0, 71373.0, 166347.0, 493834.0, 1277056.0, 1271683.0, 500511.0, 175041.0, 73067.0, 35833.0, 18963.0, 10621.0, 6055.0, 3705.0, 2222.0, 1443.0, 931.0, 637.0, 435.0, 261.0, 183.0, 141.0, 104.0, 77.0, 46.0, 27.0, 28.0, 20.0, 7.0, 12.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.53125, -37.36376953125, -36.1962890625, -35.02880859375, -33.861328125, -32.69384765625, -31.5263671875, -30.35888671875, -29.19140625, -28.02392578125, -26.8564453125, -25.68896484375, -24.521484375, -23.35400390625, -22.1865234375, -21.01904296875, -19.8515625, -18.68408203125, -17.5166015625, -16.34912109375, -15.181640625, -14.01416015625, -12.8466796875, -11.67919921875, -10.51171875, -9.34423828125, -8.1767578125, -7.00927734375, -5.841796875, -4.67431640625, -3.5068359375, -2.33935546875, -1.171875, -0.00439453125, 1.1630859375, 2.33056640625, 3.498046875, 4.66552734375, 5.8330078125, 7.00048828125, 8.16796875, 9.33544921875, 10.5029296875, 11.67041015625, 12.837890625, 14.00537109375, 15.1728515625, 16.34033203125, 17.5078125, 18.67529296875, 19.8427734375, 21.01025390625, 22.177734375, 23.34521484375, 24.5126953125, 25.68017578125, 26.84765625, 28.01513671875, 29.1826171875, 30.35009765625, 31.517578125, 32.68505859375, 33.8525390625, 35.02001953125, 36.1875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 4.0, 6.0, 6.0, 7.0, 7.0, 4.0, 12.0, 7.0, 19.0, 11.0, 14.0, 17.0, 22.0, 24.0, 23.0, 38.0, 38.0, 30.0, 44.0, 39.0, 30.0, 36.0, 35.0, 34.0, 41.0, 36.0, 48.0, 43.0, 37.0, 43.0, 32.0, 21.0, 22.0, 26.0, 22.0, 21.0, 12.0, 16.0, 14.0, 15.0, 5.0, 16.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.140625, -22.42431640625, -21.7080078125, -20.99169921875, -20.275390625, -19.55908203125, -18.8427734375, -18.12646484375, -17.41015625, -16.69384765625, -15.9775390625, -15.26123046875, -14.544921875, -13.82861328125, -13.1123046875, -12.39599609375, -11.6796875, -10.96337890625, -10.2470703125, -9.53076171875, -8.814453125, -8.09814453125, -7.3818359375, -6.66552734375, -5.94921875, -5.23291015625, -4.5166015625, -3.80029296875, -3.083984375, -2.36767578125, -1.6513671875, -0.93505859375, -0.21875, 0.49755859375, 1.2138671875, 1.93017578125, 2.646484375, 3.36279296875, 4.0791015625, 4.79541015625, 5.51171875, 6.22802734375, 6.9443359375, 7.66064453125, 8.376953125, 9.09326171875, 9.8095703125, 10.52587890625, 11.2421875, 11.95849609375, 12.6748046875, 13.39111328125, 14.107421875, 14.82373046875, 15.5400390625, 16.25634765625, 16.97265625, 17.68896484375, 18.4052734375, 19.12158203125, 19.837890625, 20.55419921875, 21.2705078125, 21.98681640625, 22.703125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 15.0, 14.0, 26.0, 41.0, 67.0, 101.0, 135.0, 247.0, 344.0, 513.0, 820.0, 1189.0, 1870.0, 3061.0, 5018.0, 8260.0, 13816.0, 24881.0, 47202.0, 97556.0, 223215.0, 576722.0, 1513856.0, 1012689.0, 363797.0, 148805.0, 68519.0, 34579.0, 18873.0, 10733.0, 6376.0, 3941.0, 2571.0, 1553.0, 1001.0, 631.0, 426.0, 250.0, 189.0, 136.0, 73.0, 44.0, 33.0, 31.0, 22.0, 13.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-47.34375, -45.98193359375, -44.6201171875, -43.25830078125, -41.896484375, -40.53466796875, -39.1728515625, -37.81103515625, -36.44921875, -35.08740234375, -33.7255859375, -32.36376953125, -31.001953125, -29.64013671875, -28.2783203125, -26.91650390625, -25.5546875, -24.19287109375, -22.8310546875, -21.46923828125, -20.107421875, -18.74560546875, -17.3837890625, -16.02197265625, -14.66015625, -13.29833984375, -11.9365234375, -10.57470703125, -9.212890625, -7.85107421875, -6.4892578125, -5.12744140625, -3.765625, -2.40380859375, -1.0419921875, 0.31982421875, 1.681640625, 3.04345703125, 4.4052734375, 5.76708984375, 7.12890625, 8.49072265625, 9.8525390625, 11.21435546875, 12.576171875, 13.93798828125, 15.2998046875, 16.66162109375, 18.0234375, 19.38525390625, 20.7470703125, 22.10888671875, 23.470703125, 24.83251953125, 26.1943359375, 27.55615234375, 28.91796875, 30.27978515625, 31.6416015625, 33.00341796875, 34.365234375, 35.72705078125, 37.0888671875, 38.45068359375, 39.8125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 5.0, 14.0, 9.0, 9.0, 21.0, 17.0, 39.0, 46.0, 68.0, 68.0, 84.0, 106.0, 128.0, 204.0, 233.0, 318.0, 367.0, 429.0, 401.0, 344.0, 259.0, 199.0, 167.0, 110.0, 89.0, 63.0, 49.0, 51.0, 29.0, 23.0, 21.0, 23.0, 18.0, 9.0, 9.0, 13.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.109375, -13.663818359375, -13.21826171875, -12.772705078125, -12.3271484375, -11.881591796875, -11.43603515625, -10.990478515625, -10.544921875, -10.099365234375, -9.65380859375, -9.208251953125, -8.7626953125, -8.317138671875, -7.87158203125, -7.426025390625, -6.98046875, -6.534912109375, -6.08935546875, -5.643798828125, -5.1982421875, -4.752685546875, -4.30712890625, -3.861572265625, -3.416015625, -2.970458984375, -2.52490234375, -2.079345703125, -1.6337890625, -1.188232421875, -0.74267578125, -0.297119140625, 0.1484375, 0.593994140625, 1.03955078125, 1.485107421875, 1.9306640625, 2.376220703125, 2.82177734375, 3.267333984375, 3.712890625, 4.158447265625, 4.60400390625, 5.049560546875, 5.4951171875, 5.940673828125, 6.38623046875, 6.831787109375, 7.27734375, 7.722900390625, 8.16845703125, 8.614013671875, 9.0595703125, 9.505126953125, 9.95068359375, 10.396240234375, 10.841796875, 11.287353515625, 11.73291015625, 12.178466796875, 12.6240234375, 13.069580078125, 13.51513671875, 13.960693359375, 14.40625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 8.0, 8.0, 12.0, 10.0, 24.0, 16.0, 26.0, 29.0, 38.0, 39.0, 40.0, 65.0, 70.0, 90.0, 81.0, 68.0, 73.0, 56.0, 43.0, 44.0, 36.0, 29.0, 27.0, 14.0, 11.0, 6.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.50014877319336, -39.3203010559082, -38.14045715332031, -36.960609436035156, -35.78076171875, -34.600914001464844, -33.42106628417969, -32.2412223815918, -31.06137466430664, -29.881526947021484, -28.70168113708496, -27.521835327148438, -26.34198760986328, -25.162139892578125, -23.9822940826416, -22.802448272705078, -21.622600555419922, -20.442752838134766, -19.262907028198242, -18.08306121826172, -16.903213500976562, -15.723366737365723, -14.543519973754883, -13.363673210144043, -12.183826446533203, -11.003979682922363, -9.824132919311523, -8.644286155700684, -7.464439392089844, -6.284592628479004, -5.104745864868164, -3.924899101257324, -2.7450523376464844, -1.5652055740356445, -0.3853588104248047, 0.7944879531860352, 1.974334716796875, 3.154181480407715, 4.334028244018555, 5.5138750076293945, 6.693721771240234, 7.873568534851074, 9.053415298461914, 10.233262062072754, 11.413108825683594, 12.592955589294434, 13.772802352905273, 14.952649116516113, 16.132495880126953, 17.31234359741211, 18.492189407348633, 19.672035217285156, 20.851882934570312, 22.03173065185547, 23.211576461791992, 24.391422271728516, 25.571269989013672, 26.751117706298828, 27.93096351623535, 29.110809326171875, 30.29065704345703, 31.470504760742188, 32.650352478027344, 33.830196380615234, 35.01004409790039]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 9.0, 5.0, 9.0, 9.0, 7.0, 14.0, 13.0, 19.0, 15.0, 20.0, 22.0, 19.0, 30.0, 39.0, 36.0, 27.0, 26.0, 47.0, 39.0, 43.0, 47.0, 39.0, 28.0, 38.0, 44.0, 42.0, 38.0, 20.0, 32.0, 28.0, 20.0, 29.0, 19.0, 18.0, 16.0, 19.0, 12.0, 14.0, 9.0, 7.0, 8.0, 4.0, 5.0, 0.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.00770378112793, -26.189672470092773, -25.37164306640625, -24.553611755371094, -23.735580444335938, -22.917551040649414, -22.099519729614258, -21.281490325927734, -20.463459014892578, -19.645427703857422, -18.8273983001709, -18.009366989135742, -17.19133758544922, -16.373306274414062, -15.555274963378906, -14.737244606018066, -13.919214248657227, -13.101183891296387, -12.283153533935547, -11.46512222290039, -10.64709186553955, -9.829061508178711, -9.011030197143555, -8.192999839782715, -7.374969482421875, -6.556939125061035, -5.738908290863037, -4.920877456665039, -4.102847099304199, -3.2848167419433594, -2.4667859077453613, -1.6487550735473633, -0.8307228088378906, -0.01269221305847168, 0.8053383827209473, 1.6233689785003662, 2.441399574279785, 3.259429931640625, 4.077460765838623, 4.895491600036621, 5.713521957397461, 6.531552314758301, 7.349583148956299, 8.167613983154297, 8.985644340515137, 9.803674697875977, 10.621706008911133, 11.439736366271973, 12.257766723632812, 13.075797080993652, 13.893827438354492, 14.711858749389648, 15.529889106750488, 16.347919464111328, 17.165950775146484, 17.98398208618164, 18.802011489868164, 19.62004280090332, 20.438072204589844, 21.256103515625, 22.074134826660156, 22.89216423034668, 23.710195541381836, 24.52822494506836, 25.346256256103516]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 14.0, 13.0, 21.0, 31.0, 47.0, 50.0, 94.0, 140.0, 221.0, 352.0, 499.0, 779.0, 1235.0, 1989.0, 3218.0, 5306.0, 9033.0, 15735.0, 28390.0, 54843.0, 112559.0, 234187.0, 281370.0, 146667.0, 69528.0, 35559.0, 19205.0, 10934.0, 6299.0, 3764.0, 2385.0, 1457.0, 897.0, 579.0, 408.0, 259.0, 157.0, 115.0, 76.0, 44.0, 33.0, 28.0, 7.0, 9.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.109375, -23.282958984375, -22.45654296875, -21.630126953125, -20.8037109375, -19.977294921875, -19.15087890625, -18.324462890625, -17.498046875, -16.671630859375, -15.84521484375, -15.018798828125, -14.1923828125, -13.365966796875, -12.53955078125, -11.713134765625, -10.88671875, -10.060302734375, -9.23388671875, -8.407470703125, -7.5810546875, -6.754638671875, -5.92822265625, -5.101806640625, -4.275390625, -3.448974609375, -2.62255859375, -1.796142578125, -0.9697265625, -0.143310546875, 0.68310546875, 1.509521484375, 2.3359375, 3.162353515625, 3.98876953125, 4.815185546875, 5.6416015625, 6.468017578125, 7.29443359375, 8.120849609375, 8.947265625, 9.773681640625, 10.60009765625, 11.426513671875, 12.2529296875, 13.079345703125, 13.90576171875, 14.732177734375, 15.55859375, 16.385009765625, 17.21142578125, 18.037841796875, 18.8642578125, 19.690673828125, 20.51708984375, 21.343505859375, 22.169921875, 22.996337890625, 23.82275390625, 24.649169921875, 25.4755859375, 26.302001953125, 27.12841796875, 27.954833984375, 28.78125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 9.0, 9.0, 12.0, 10.0, 14.0, 11.0, 13.0, 13.0, 24.0, 17.0, 18.0, 26.0, 31.0, 30.0, 38.0, 40.0, 51.0, 38.0, 36.0, 47.0, 36.0, 23.0, 50.0, 40.0, 44.0, 35.0, 39.0, 29.0, 37.0, 24.0, 27.0, 22.0, 20.0, 10.0, 18.0, 12.0, 6.0, 4.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.75, -26.885498046875, -26.02099609375, -25.156494140625, -24.2919921875, -23.427490234375, -22.56298828125, -21.698486328125, -20.833984375, -19.969482421875, -19.10498046875, -18.240478515625, -17.3759765625, -16.511474609375, -15.64697265625, -14.782470703125, -13.91796875, -13.053466796875, -12.18896484375, -11.324462890625, -10.4599609375, -9.595458984375, -8.73095703125, -7.866455078125, -7.001953125, -6.137451171875, -5.27294921875, -4.408447265625, -3.5439453125, -2.679443359375, -1.81494140625, -0.950439453125, -0.0859375, 0.778564453125, 1.64306640625, 2.507568359375, 3.3720703125, 4.236572265625, 5.10107421875, 5.965576171875, 6.830078125, 7.694580078125, 8.55908203125, 9.423583984375, 10.2880859375, 11.152587890625, 12.01708984375, 12.881591796875, 13.74609375, 14.610595703125, 15.47509765625, 16.339599609375, 17.2041015625, 18.068603515625, 18.93310546875, 19.797607421875, 20.662109375, 21.526611328125, 22.39111328125, 23.255615234375, 24.1201171875, 24.984619140625, 25.84912109375, 26.713623046875, 27.578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 11.0, 7.0, 13.0, 15.0, 28.0, 39.0, 53.0, 73.0, 124.0, 139.0, 184.0, 307.0, 413.0, 557.0, 887.0, 1253.0, 1956.0, 3020.0, 4691.0, 7591.0, 12507.0, 21374.0, 38597.0, 73828.0, 161121.0, 316051.0, 203853.0, 90588.0, 45469.0, 25069.0, 14428.0, 8731.0, 5290.0, 3469.0, 2154.0, 1461.0, 974.0, 680.0, 490.0, 294.0, 214.0, 149.0, 113.0, 81.0, 60.0, 42.0, 28.0, 23.0, 11.0, 9.0, 12.0, 11.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-30.71875, -29.747802734375, -28.77685546875, -27.805908203125, -26.8349609375, -25.864013671875, -24.89306640625, -23.922119140625, -22.951171875, -21.980224609375, -21.00927734375, -20.038330078125, -19.0673828125, -18.096435546875, -17.12548828125, -16.154541015625, -15.18359375, -14.212646484375, -13.24169921875, -12.270751953125, -11.2998046875, -10.328857421875, -9.35791015625, -8.386962890625, -7.416015625, -6.445068359375, -5.47412109375, -4.503173828125, -3.5322265625, -2.561279296875, -1.59033203125, -0.619384765625, 0.3515625, 1.322509765625, 2.29345703125, 3.264404296875, 4.2353515625, 5.206298828125, 6.17724609375, 7.148193359375, 8.119140625, 9.090087890625, 10.06103515625, 11.031982421875, 12.0029296875, 12.973876953125, 13.94482421875, 14.915771484375, 15.88671875, 16.857666015625, 17.82861328125, 18.799560546875, 19.7705078125, 20.741455078125, 21.71240234375, 22.683349609375, 23.654296875, 24.625244140625, 25.59619140625, 26.567138671875, 27.5380859375, 28.509033203125, 29.47998046875, 30.450927734375, 31.421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 7.0, 7.0, 12.0, 4.0, 21.0, 11.0, 18.0, 15.0, 18.0, 21.0, 23.0, 26.0, 32.0, 28.0, 29.0, 27.0, 41.0, 43.0, 38.0, 36.0, 36.0, 29.0, 37.0, 38.0, 35.0, 39.0, 44.0, 34.0, 29.0, 23.0, 31.0, 20.0, 16.0, 20.0, 20.0, 18.0, 12.0, 9.0, 7.0, 6.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.03125, -16.510498046875, -15.98974609375, -15.468994140625, -14.9482421875, -14.427490234375, -13.90673828125, -13.385986328125, -12.865234375, -12.344482421875, -11.82373046875, -11.302978515625, -10.7822265625, -10.261474609375, -9.74072265625, -9.219970703125, -8.69921875, -8.178466796875, -7.65771484375, -7.136962890625, -6.6162109375, -6.095458984375, -5.57470703125, -5.053955078125, -4.533203125, -4.012451171875, -3.49169921875, -2.970947265625, -2.4501953125, -1.929443359375, -1.40869140625, -0.887939453125, -0.3671875, 0.153564453125, 0.67431640625, 1.195068359375, 1.7158203125, 2.236572265625, 2.75732421875, 3.278076171875, 3.798828125, 4.319580078125, 4.84033203125, 5.361083984375, 5.8818359375, 6.402587890625, 6.92333984375, 7.444091796875, 7.96484375, 8.485595703125, 9.00634765625, 9.527099609375, 10.0478515625, 10.568603515625, 11.08935546875, 11.610107421875, 12.130859375, 12.651611328125, 13.17236328125, 13.693115234375, 14.2138671875, 14.734619140625, 15.25537109375, 15.776123046875, 16.296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 7.0, 8.0, 8.0, 13.0, 17.0, 16.0, 28.0, 35.0, 69.0, 73.0, 104.0, 153.0, 226.0, 293.0, 494.0, 674.0, 1014.0, 1632.0, 2551.0, 4373.0, 8143.0, 16482.0, 38717.0, 108711.0, 345287.0, 338790.0, 106200.0, 38250.0, 16362.0, 8053.0, 4461.0, 2539.0, 1591.0, 983.0, 680.0, 417.0, 301.0, 231.0, 155.0, 125.0, 86.0, 50.0, 39.0, 29.0, 24.0, 21.0, 11.0, 7.0, 6.0, 10.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-12.3828125, -11.9957275390625, -11.608642578125, -11.2215576171875, -10.83447265625, -10.4473876953125, -10.060302734375, -9.6732177734375, -9.2861328125, -8.8990478515625, -8.511962890625, -8.1248779296875, -7.73779296875, -7.3507080078125, -6.963623046875, -6.5765380859375, -6.189453125, -5.8023681640625, -5.415283203125, -5.0281982421875, -4.64111328125, -4.2540283203125, -3.866943359375, -3.4798583984375, -3.0927734375, -2.7056884765625, -2.318603515625, -1.9315185546875, -1.54443359375, -1.1573486328125, -0.770263671875, -0.3831787109375, 0.00390625, 0.3909912109375, 0.778076171875, 1.1651611328125, 1.55224609375, 1.9393310546875, 2.326416015625, 2.7135009765625, 3.1005859375, 3.4876708984375, 3.874755859375, 4.2618408203125, 4.64892578125, 5.0360107421875, 5.423095703125, 5.8101806640625, 6.197265625, 6.5843505859375, 6.971435546875, 7.3585205078125, 7.74560546875, 8.1326904296875, 8.519775390625, 8.9068603515625, 9.2939453125, 9.6810302734375, 10.068115234375, 10.4552001953125, 10.84228515625, 11.2293701171875, 11.616455078125, 12.0035400390625, 12.390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 6.0, 6.0, 21.0, 15.0, 22.0, 40.0, 58.0, 85.0, 90.0, 123.0, 131.0, 109.0, 78.0, 62.0, 28.0, 31.0, 16.0, 18.0, 8.0, 17.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001354217529296875, -0.0013121068477630615, -0.001269996166229248, -0.0012278854846954346, -0.001185774803161621, -0.0011436641216278076, -0.0011015534400939941, -0.0010594427585601807, -0.0010173320770263672, -0.0009752213954925537, -0.0009331107139587402, -0.0008910000324249268, -0.0008488893508911133, -0.0008067786693572998, -0.0007646679878234863, -0.0007225573062896729, -0.0006804466247558594, -0.0006383359432220459, -0.0005962252616882324, -0.0005541145801544189, -0.0005120038986206055, -0.000469893217086792, -0.0004277825355529785, -0.00038567185401916504, -0.00034356117248535156, -0.0003014504909515381, -0.0002593398094177246, -0.00021722912788391113, -0.00017511844635009766, -0.00013300776481628418, -9.08970832824707e-05, -4.8786401748657227e-05, -6.67572021484375e-06, 3.5434961318969727e-05, 7.75456428527832e-05, 0.00011965632438659668, 0.00016176700592041016, 0.00020387768745422363, 0.0002459883689880371, 0.0002880990505218506, 0.00033020973205566406, 0.00037232041358947754, 0.000414431095123291, 0.0004565417766571045, 0.000498652458190918, 0.0005407631397247314, 0.0005828738212585449, 0.0006249845027923584, 0.0006670951843261719, 0.0007092058658599854, 0.0007513165473937988, 0.0007934272289276123, 0.0008355379104614258, 0.0008776485919952393, 0.0009197592735290527, 0.0009618699550628662, 0.0010039806365966797, 0.0010460913181304932, 0.0010882019996643066, 0.0011303126811981201, 0.0011724233627319336, 0.001214534044265747, 0.0012566447257995605, 0.001298755407333374, 0.0013408660888671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 20.0, 27.0, 35.0, 44.0, 89.0, 104.0, 142.0, 266.0, 381.0, 558.0, 931.0, 1436.0, 2421.0, 4361.0, 8479.0, 18028.0, 42162.0, 110200.0, 302873.0, 337153.0, 129158.0, 47914.0, 20440.0, 9449.0, 4912.0, 2693.0, 1532.0, 945.0, 604.0, 407.0, 256.0, 172.0, 109.0, 79.0, 56.0, 36.0, 31.0, 14.0, 14.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.1484375, -14.6904296875, -14.232421875, -13.7744140625, -13.31640625, -12.8583984375, -12.400390625, -11.9423828125, -11.484375, -11.0263671875, -10.568359375, -10.1103515625, -9.65234375, -9.1943359375, -8.736328125, -8.2783203125, -7.8203125, -7.3623046875, -6.904296875, -6.4462890625, -5.98828125, -5.5302734375, -5.072265625, -4.6142578125, -4.15625, -3.6982421875, -3.240234375, -2.7822265625, -2.32421875, -1.8662109375, -1.408203125, -0.9501953125, -0.4921875, -0.0341796875, 0.423828125, 0.8818359375, 1.33984375, 1.7978515625, 2.255859375, 2.7138671875, 3.171875, 3.6298828125, 4.087890625, 4.5458984375, 5.00390625, 5.4619140625, 5.919921875, 6.3779296875, 6.8359375, 7.2939453125, 7.751953125, 8.2099609375, 8.66796875, 9.1259765625, 9.583984375, 10.0419921875, 10.5, 10.9580078125, 11.416015625, 11.8740234375, 12.33203125, 12.7900390625, 13.248046875, 13.7060546875, 14.1640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 13.0, 13.0, 13.0, 20.0, 21.0, 24.0, 36.0, 44.0, 34.0, 69.0, 51.0, 71.0, 79.0, 68.0, 94.0, 59.0, 45.0, 34.0, 38.0, 35.0, 18.0, 27.0, 17.0, 13.0, 10.0, 7.0, 9.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.79296875, -3.673370361328125, -3.55377197265625, -3.434173583984375, -3.3145751953125, -3.194976806640625, -3.07537841796875, -2.955780029296875, -2.836181640625, -2.716583251953125, -2.59698486328125, -2.477386474609375, -2.3577880859375, -2.238189697265625, -2.11859130859375, -1.998992919921875, -1.87939453125, -1.759796142578125, -1.64019775390625, -1.520599365234375, -1.4010009765625, -1.281402587890625, -1.16180419921875, -1.042205810546875, -0.922607421875, -0.803009033203125, -0.68341064453125, -0.563812255859375, -0.4442138671875, -0.324615478515625, -0.20501708984375, -0.085418701171875, 0.0341796875, 0.153778076171875, 0.27337646484375, 0.392974853515625, 0.5125732421875, 0.632171630859375, 0.75177001953125, 0.871368408203125, 0.990966796875, 1.110565185546875, 1.23016357421875, 1.349761962890625, 1.4693603515625, 1.588958740234375, 1.70855712890625, 1.828155517578125, 1.94775390625, 2.067352294921875, 2.18695068359375, 2.306549072265625, 2.4261474609375, 2.545745849609375, 2.66534423828125, 2.784942626953125, 2.904541015625, 3.024139404296875, 3.14373779296875, 3.263336181640625, 3.3829345703125, 3.502532958984375, 3.62213134765625, 3.741729736328125, 3.861328125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 0.0, 4.0, 4.0, 6.0, 12.0, 13.0, 13.0, 18.0, 18.0, 22.0, 25.0, 37.0, 31.0, 47.0, 37.0, 78.0, 67.0, 81.0, 60.0, 73.0, 62.0, 51.0, 45.0, 44.0, 37.0, 21.0, 19.0, 20.0, 13.0, 4.0, 8.0, 9.0, 8.0, 5.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.11933517456055, -35.052528381347656, -33.98572540283203, -32.91891860961914, -31.85211181640625, -30.78530502319336, -29.7185001373291, -28.651695251464844, -27.584888458251953, -26.518081665039062, -25.451276779174805, -24.384471893310547, -23.317665100097656, -22.250858306884766, -21.184053421020508, -20.11724853515625, -19.05044174194336, -17.98363494873047, -16.91683006286621, -15.850024223327637, -14.783218383789062, -13.716412544250488, -12.649606704711914, -11.58280086517334, -10.515995025634766, -9.449189186096191, -8.382383346557617, -7.315577507019043, -6.248771667480469, -5.1819658279418945, -4.11515998840332, -3.048354148864746, -1.9815483093261719, -0.9147424697875977, 0.15206336975097656, 1.2188692092895508, 2.285675048828125, 3.352480888366699, 4.419286727905273, 5.486092567443848, 6.552898406982422, 7.619704246520996, 8.68651008605957, 9.753315925598145, 10.820121765136719, 11.886927604675293, 12.953733444213867, 14.020539283752441, 15.087345123291016, 16.154151916503906, 17.220956802368164, 18.287761688232422, 19.354568481445312, 20.421375274658203, 21.48818016052246, 22.55498504638672, 23.62179183959961, 24.6885986328125, 25.755403518676758, 26.822208404541016, 27.889015197753906, 28.955821990966797, 30.022626876831055, 31.089431762695312, 32.1562385559082]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 8.0, 8.0, 7.0, 10.0, 10.0, 20.0, 11.0, 15.0, 17.0, 20.0, 28.0, 34.0, 29.0, 29.0, 37.0, 34.0, 42.0, 40.0, 40.0, 43.0, 55.0, 36.0, 35.0, 39.0, 38.0, 44.0, 20.0, 33.0, 28.0, 22.0, 24.0, 20.0, 16.0, 17.0, 17.0, 14.0, 11.0, 6.0, 12.0, 3.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.12033462524414, -26.297992706298828, -25.47565269470215, -24.65331268310547, -23.830970764160156, -23.008628845214844, -22.186288833618164, -21.363948822021484, -20.541606903076172, -19.71926498413086, -18.89692497253418, -18.0745849609375, -17.252243041992188, -16.429901123046875, -15.607561111450195, -14.7852201461792, -13.962879180908203, -13.140538215637207, -12.318197250366211, -11.495856285095215, -10.673515319824219, -9.851174354553223, -9.028833389282227, -8.20649242401123, -7.384151458740234, -6.561810493469238, -5.739469528198242, -4.917128562927246, -4.09478759765625, -3.272446632385254, -2.450105667114258, -1.6277647018432617, -0.8054256439208984, 0.016915321350097656, 0.8392562866210938, 1.6615972518920898, 2.483938217163086, 3.306279182434082, 4.128620147705078, 4.950961112976074, 5.77330207824707, 6.595643043518066, 7.4179840087890625, 8.240324974060059, 9.062665939331055, 9.88500690460205, 10.707347869873047, 11.529688835144043, 12.352029800415039, 13.174370765686035, 13.996711730957031, 14.819052696228027, 15.641393661499023, 16.463733673095703, 17.286075592041016, 18.108417510986328, 18.930757522583008, 19.753097534179688, 20.575439453125, 21.397781372070312, 22.220121383666992, 23.042461395263672, 23.864803314208984, 24.687145233154297, 25.509485244750977]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 11.0, 23.0, 26.0, 50.0, 61.0, 86.0, 136.0, 185.0, 267.0, 462.0, 668.0, 1018.0, 1528.0, 2482.0, 4022.0, 6486.0, 10565.0, 17866.0, 30177.0, 51644.0, 90415.0, 155859.0, 223901.0, 185500.0, 110358.0, 62959.0, 36558.0, 21603.0, 12812.0, 7783.0, 4844.0, 2892.0, 1879.0, 1202.0, 747.0, 493.0, 330.0, 186.0, 145.0, 105.0, 83.0, 40.0, 25.0, 24.0, 19.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.5, -33.4443359375, -32.388671875, -31.3330078125, -30.27734375, -29.2216796875, -28.166015625, -27.1103515625, -26.0546875, -24.9990234375, -23.943359375, -22.8876953125, -21.83203125, -20.7763671875, -19.720703125, -18.6650390625, -17.609375, -16.5537109375, -15.498046875, -14.4423828125, -13.38671875, -12.3310546875, -11.275390625, -10.2197265625, -9.1640625, -8.1083984375, -7.052734375, -5.9970703125, -4.94140625, -3.8857421875, -2.830078125, -1.7744140625, -0.71875, 0.3369140625, 1.392578125, 2.4482421875, 3.50390625, 4.5595703125, 5.615234375, 6.6708984375, 7.7265625, 8.7822265625, 9.837890625, 10.8935546875, 11.94921875, 13.0048828125, 14.060546875, 15.1162109375, 16.171875, 17.2275390625, 18.283203125, 19.3388671875, 20.39453125, 21.4501953125, 22.505859375, 23.5615234375, 24.6171875, 25.6728515625, 26.728515625, 27.7841796875, 28.83984375, 29.8955078125, 30.951171875, 32.0068359375, 33.0625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 7.0, 14.0, 8.0, 7.0, 21.0, 16.0, 21.0, 25.0, 17.0, 31.0, 32.0, 31.0, 32.0, 34.0, 51.0, 50.0, 49.0, 44.0, 49.0, 51.0, 42.0, 39.0, 37.0, 36.0, 30.0, 23.0, 29.0, 21.0, 29.0, 17.0, 16.0, 19.0, 13.0, 10.0, 9.0, 4.0, 9.0, 1.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.25, -28.353759765625, -27.45751953125, -26.561279296875, -25.6650390625, -24.768798828125, -23.87255859375, -22.976318359375, -22.080078125, -21.183837890625, -20.28759765625, -19.391357421875, -18.4951171875, -17.598876953125, -16.70263671875, -15.806396484375, -14.91015625, -14.013916015625, -13.11767578125, -12.221435546875, -11.3251953125, -10.428955078125, -9.53271484375, -8.636474609375, -7.740234375, -6.843994140625, -5.94775390625, -5.051513671875, -4.1552734375, -3.259033203125, -2.36279296875, -1.466552734375, -0.5703125, 0.325927734375, 1.22216796875, 2.118408203125, 3.0146484375, 3.910888671875, 4.80712890625, 5.703369140625, 6.599609375, 7.495849609375, 8.39208984375, 9.288330078125, 10.1845703125, 11.080810546875, 11.97705078125, 12.873291015625, 13.76953125, 14.665771484375, 15.56201171875, 16.458251953125, 17.3544921875, 18.250732421875, 19.14697265625, 20.043212890625, 20.939453125, 21.835693359375, 22.73193359375, 23.628173828125, 24.5244140625, 25.420654296875, 26.31689453125, 27.213134765625, 28.109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 10.0, 16.0, 16.0, 33.0, 45.0, 72.0, 94.0, 156.0, 214.0, 336.0, 521.0, 774.0, 1145.0, 1670.0, 2568.0, 4167.0, 6660.0, 10820.0, 17870.0, 30627.0, 53721.0, 91574.0, 150177.0, 205882.0, 181913.0, 117987.0, 69567.0, 39868.0, 22959.0, 13917.0, 8489.0, 5319.0, 3217.0, 2074.0, 1349.0, 924.0, 613.0, 412.0, 249.0, 190.0, 109.0, 75.0, 53.0, 45.0, 28.0, 15.0, 5.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.4375, -35.28955078125, -34.1416015625, -32.99365234375, -31.845703125, -30.69775390625, -29.5498046875, -28.40185546875, -27.25390625, -26.10595703125, -24.9580078125, -23.81005859375, -22.662109375, -21.51416015625, -20.3662109375, -19.21826171875, -18.0703125, -16.92236328125, -15.7744140625, -14.62646484375, -13.478515625, -12.33056640625, -11.1826171875, -10.03466796875, -8.88671875, -7.73876953125, -6.5908203125, -5.44287109375, -4.294921875, -3.14697265625, -1.9990234375, -0.85107421875, 0.296875, 1.44482421875, 2.5927734375, 3.74072265625, 4.888671875, 6.03662109375, 7.1845703125, 8.33251953125, 9.48046875, 10.62841796875, 11.7763671875, 12.92431640625, 14.072265625, 15.22021484375, 16.3681640625, 17.51611328125, 18.6640625, 19.81201171875, 20.9599609375, 22.10791015625, 23.255859375, 24.40380859375, 25.5517578125, 26.69970703125, 27.84765625, 28.99560546875, 30.1435546875, 31.29150390625, 32.439453125, 33.58740234375, 34.7353515625, 35.88330078125, 37.03125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 6.0, 7.0, 13.0, 8.0, 13.0, 12.0, 20.0, 26.0, 31.0, 39.0, 29.0, 29.0, 35.0, 44.0, 35.0, 46.0, 32.0, 36.0, 27.0, 40.0, 42.0, 48.0, 37.0, 36.0, 27.0, 30.0, 43.0, 39.0, 27.0, 24.0, 16.0, 15.0, 11.0, 10.0, 5.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.34375, -15.7919921875, -15.240234375, -14.6884765625, -14.13671875, -13.5849609375, -13.033203125, -12.4814453125, -11.9296875, -11.3779296875, -10.826171875, -10.2744140625, -9.72265625, -9.1708984375, -8.619140625, -8.0673828125, -7.515625, -6.9638671875, -6.412109375, -5.8603515625, -5.30859375, -4.7568359375, -4.205078125, -3.6533203125, -3.1015625, -2.5498046875, -1.998046875, -1.4462890625, -0.89453125, -0.3427734375, 0.208984375, 0.7607421875, 1.3125, 1.8642578125, 2.416015625, 2.9677734375, 3.51953125, 4.0712890625, 4.623046875, 5.1748046875, 5.7265625, 6.2783203125, 6.830078125, 7.3818359375, 7.93359375, 8.4853515625, 9.037109375, 9.5888671875, 10.140625, 10.6923828125, 11.244140625, 11.7958984375, 12.34765625, 12.8994140625, 13.451171875, 14.0029296875, 14.5546875, 15.1064453125, 15.658203125, 16.2099609375, 16.76171875, 17.3134765625, 17.865234375, 18.4169921875, 18.96875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 8.0, 8.0, 14.0, 23.0, 21.0, 44.0, 66.0, 68.0, 122.0, 185.0, 291.0, 395.0, 608.0, 1017.0, 1666.0, 3040.0, 5700.0, 11886.0, 27226.0, 70105.0, 209928.0, 423218.0, 183367.0, 62248.0, 24285.0, 10688.0, 5259.0, 2680.0, 1602.0, 951.0, 580.0, 409.0, 269.0, 171.0, 125.0, 92.0, 60.0, 41.0, 33.0, 20.0, 10.0, 12.0, 6.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.109375, -20.392333984375, -19.67529296875, -18.958251953125, -18.2412109375, -17.524169921875, -16.80712890625, -16.090087890625, -15.373046875, -14.656005859375, -13.93896484375, -13.221923828125, -12.5048828125, -11.787841796875, -11.07080078125, -10.353759765625, -9.63671875, -8.919677734375, -8.20263671875, -7.485595703125, -6.7685546875, -6.051513671875, -5.33447265625, -4.617431640625, -3.900390625, -3.183349609375, -2.46630859375, -1.749267578125, -1.0322265625, -0.315185546875, 0.40185546875, 1.118896484375, 1.8359375, 2.552978515625, 3.27001953125, 3.987060546875, 4.7041015625, 5.421142578125, 6.13818359375, 6.855224609375, 7.572265625, 8.289306640625, 9.00634765625, 9.723388671875, 10.4404296875, 11.157470703125, 11.87451171875, 12.591552734375, 13.30859375, 14.025634765625, 14.74267578125, 15.459716796875, 16.1767578125, 16.893798828125, 17.61083984375, 18.327880859375, 19.044921875, 19.761962890625, 20.47900390625, 21.196044921875, 21.9130859375, 22.630126953125, 23.34716796875, 24.064208984375, 24.78125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 5.0, 13.0, 10.0, 27.0, 39.0, 54.0, 81.0, 125.0, 201.0, 166.0, 106.0, 57.0, 35.0, 20.0, 16.0, 11.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027484893798828125, -0.002658754587173462, -0.0025690197944641113, -0.0024792850017547607, -0.00238955020904541, -0.0022998154163360596, -0.002210080623626709, -0.0021203458309173584, -0.002030611038208008, -0.0019408762454986572, -0.0018511414527893066, -0.001761406660079956, -0.0016716718673706055, -0.0015819370746612549, -0.0014922022819519043, -0.0014024674892425537, -0.0013127326965332031, -0.0012229979038238525, -0.001133263111114502, -0.0010435283184051514, -0.0009537935256958008, -0.0008640587329864502, -0.0007743239402770996, -0.000684589147567749, -0.0005948543548583984, -0.0005051195621490479, -0.00041538476943969727, -0.0003256499767303467, -0.0002359151840209961, -0.0001461803913116455, -5.644559860229492e-05, 3.3289194107055664e-05, 0.00012302398681640625, 0.00021275877952575684, 0.0003024935722351074, 0.000392228364944458, 0.0004819631576538086, 0.0005716979503631592, 0.0006614327430725098, 0.0007511675357818604, 0.0008409023284912109, 0.0009306371212005615, 0.0010203719139099121, 0.0011101067066192627, 0.0011998414993286133, 0.0012895762920379639, 0.0013793110847473145, 0.001469045877456665, 0.0015587806701660156, 0.0016485154628753662, 0.0017382502555847168, 0.0018279850482940674, 0.001917719841003418, 0.0020074546337127686, 0.002097189426422119, 0.0021869242191314697, 0.0022766590118408203, 0.002366393804550171, 0.0024561285972595215, 0.002545863389968872, 0.0026355981826782227, 0.0027253329753875732, 0.002815067768096924, 0.0029048025608062744, 0.002994537353515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 15.0, 23.0, 38.0, 37.0, 56.0, 79.0, 109.0, 137.0, 188.0, 315.0, 418.0, 631.0, 993.0, 1495.0, 2242.0, 3685.0, 6216.0, 10991.0, 19692.0, 37247.0, 74553.0, 156111.0, 280633.0, 225012.0, 109639.0, 53671.0, 27452.0, 15172.0, 8334.0, 4905.0, 2913.0, 1824.0, 1176.0, 790.0, 548.0, 364.0, 222.0, 167.0, 117.0, 81.0, 62.0, 48.0, 23.0, 33.0, 18.0, 18.0, 9.0, 13.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0], "bins": [-14.78125, -14.28466796875, -13.7880859375, -13.29150390625, -12.794921875, -12.29833984375, -11.8017578125, -11.30517578125, -10.80859375, -10.31201171875, -9.8154296875, -9.31884765625, -8.822265625, -8.32568359375, -7.8291015625, -7.33251953125, -6.8359375, -6.33935546875, -5.8427734375, -5.34619140625, -4.849609375, -4.35302734375, -3.8564453125, -3.35986328125, -2.86328125, -2.36669921875, -1.8701171875, -1.37353515625, -0.876953125, -0.38037109375, 0.1162109375, 0.61279296875, 1.109375, 1.60595703125, 2.1025390625, 2.59912109375, 3.095703125, 3.59228515625, 4.0888671875, 4.58544921875, 5.08203125, 5.57861328125, 6.0751953125, 6.57177734375, 7.068359375, 7.56494140625, 8.0615234375, 8.55810546875, 9.0546875, 9.55126953125, 10.0478515625, 10.54443359375, 11.041015625, 11.53759765625, 12.0341796875, 12.53076171875, 13.02734375, 13.52392578125, 14.0205078125, 14.51708984375, 15.013671875, 15.51025390625, 16.0068359375, 16.50341796875, 17.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 4.0, 3.0, 4.0, 12.0, 13.0, 10.0, 13.0, 13.0, 23.0, 15.0, 41.0, 32.0, 44.0, 60.0, 53.0, 82.0, 87.0, 80.0, 68.0, 53.0, 40.0, 34.0, 37.0, 26.0, 30.0, 21.0, 21.0, 12.0, 23.0, 12.0, 4.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.97265625, -4.8109130859375, -4.649169921875, -4.4874267578125, -4.32568359375, -4.1639404296875, -4.002197265625, -3.8404541015625, -3.6787109375, -3.5169677734375, -3.355224609375, -3.1934814453125, -3.03173828125, -2.8699951171875, -2.708251953125, -2.5465087890625, -2.384765625, -2.2230224609375, -2.061279296875, -1.8995361328125, -1.73779296875, -1.5760498046875, -1.414306640625, -1.2525634765625, -1.0908203125, -0.9290771484375, -0.767333984375, -0.6055908203125, -0.44384765625, -0.2821044921875, -0.120361328125, 0.0413818359375, 0.203125, 0.3648681640625, 0.526611328125, 0.6883544921875, 0.85009765625, 1.0118408203125, 1.173583984375, 1.3353271484375, 1.4970703125, 1.6588134765625, 1.820556640625, 1.9822998046875, 2.14404296875, 2.3057861328125, 2.467529296875, 2.6292724609375, 2.791015625, 2.9527587890625, 3.114501953125, 3.2762451171875, 3.43798828125, 3.5997314453125, 3.761474609375, 3.9232177734375, 4.0849609375, 4.2467041015625, 4.408447265625, 4.5701904296875, 4.73193359375, 4.8936767578125, 5.055419921875, 5.2171630859375, 5.37890625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 6.0, 3.0, 8.0, 5.0, 9.0, 11.0, 12.0, 14.0, 17.0, 24.0, 30.0, 35.0, 55.0, 40.0, 56.0, 76.0, 90.0, 67.0, 73.0, 64.0, 54.0, 52.0, 43.0, 39.0, 26.0, 20.0, 12.0, 14.0, 10.0, 7.0, 10.0, 4.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.735443115234375, -35.59249496459961, -34.44954299926758, -33.30659484863281, -32.16364288330078, -31.020694732666016, -29.877744674682617, -28.73479461669922, -27.59184455871582, -26.448894500732422, -25.305944442749023, -24.162994384765625, -23.02004623413086, -21.877094268798828, -20.734146118164062, -19.591196060180664, -18.448246002197266, -17.305295944213867, -16.16234588623047, -15.019396781921387, -13.876446723937988, -12.73349666595459, -11.590547561645508, -10.44759750366211, -9.304647445678711, -8.161697387695312, -7.018747806549072, -5.875798225402832, -4.732848167419434, -3.589898109436035, -2.446948528289795, -1.3039989471435547, -0.16104507446289062, 0.9819047451019287, 2.124854564666748, 3.2678043842315674, 4.410754203796387, 5.553704261779785, 6.696653842926025, 7.839603424072266, 8.982553482055664, 10.125503540039062, 11.268453598022461, 12.411402702331543, 13.554352760314941, 14.69730281829834, 15.840251922607422, 16.98320198059082, 18.12615203857422, 19.269102096557617, 20.412052154541016, 21.555002212524414, 22.697952270507812, 23.840900421142578, 24.983850479125977, 26.126800537109375, 27.269750595092773, 28.412700653076172, 29.55565071105957, 30.69860076904297, 31.841548919677734, 32.984500885009766, 34.12744903564453, 35.27040100097656, 36.41334915161133]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 10.0, 10.0, 7.0, 10.0, 13.0, 13.0, 21.0, 23.0, 26.0, 29.0, 45.0, 35.0, 38.0, 33.0, 31.0, 45.0, 50.0, 40.0, 47.0, 37.0, 37.0, 39.0, 43.0, 43.0, 44.0, 25.0, 32.0, 26.0, 21.0, 29.0, 17.0, 17.0, 14.0, 7.0, 14.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.86671257019043, -25.917133331298828, -24.967554092407227, -24.017974853515625, -23.068397521972656, -22.118816375732422, -21.169239044189453, -20.21965980529785, -19.27008056640625, -18.32050132751465, -17.370922088623047, -16.421342849731445, -15.47176456451416, -14.522185325622559, -13.572607040405273, -12.623027801513672, -11.67344856262207, -10.723869323730469, -9.774290084838867, -8.824711799621582, -7.8751325607299805, -6.925553321838379, -5.9759745597839355, -5.026395797729492, -4.076816558837891, -3.127237558364868, -2.1776585578918457, -1.2280795574188232, -0.2785005569458008, 0.6710786819458008, 1.6206574440002441, 2.5702362060546875, 3.5198135375976562, 4.469392776489258, 5.418971538543701, 6.3685503005981445, 7.318129539489746, 8.267708778381348, 9.217287063598633, 10.166866302490234, 11.116445541381836, 12.066024780273438, 13.015604019165039, 13.965182304382324, 14.914761543273926, 15.864340782165527, 16.813919067382812, 17.763498306274414, 18.713077545166016, 19.662656784057617, 20.61223602294922, 21.56181526184082, 22.511394500732422, 23.46097183227539, 24.410551071166992, 25.360130310058594, 26.309709548950195, 27.259288787841797, 28.2088680267334, 29.158447265625, 30.10802459716797, 31.057605743408203, 32.00718307495117, 32.956764221191406, 33.906341552734375]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 12.0, 18.0, 19.0, 25.0, 44.0, 71.0, 76.0, 118.0, 197.0, 265.0, 390.0, 572.0, 816.0, 1203.0, 1902.0, 2836.0, 4372.0, 7179.0, 11711.0, 20385.0, 37611.0, 77496.0, 183391.0, 533117.0, 1277159.0, 1214469.0, 480743.0, 175517.0, 74058.0, 37242.0, 20494.0, 11794.0, 6987.0, 4307.0, 2668.0, 1668.0, 1178.0, 735.0, 471.0, 308.0, 209.0, 151.0, 91.0, 61.0, 47.0, 39.0, 18.0, 12.0, 8.0, 13.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.5625, -31.39794921875, -30.2333984375, -29.06884765625, -27.904296875, -26.73974609375, -25.5751953125, -24.41064453125, -23.24609375, -22.08154296875, -20.9169921875, -19.75244140625, -18.587890625, -17.42333984375, -16.2587890625, -15.09423828125, -13.9296875, -12.76513671875, -11.6005859375, -10.43603515625, -9.271484375, -8.10693359375, -6.9423828125, -5.77783203125, -4.61328125, -3.44873046875, -2.2841796875, -1.11962890625, 0.044921875, 1.20947265625, 2.3740234375, 3.53857421875, 4.703125, 5.86767578125, 7.0322265625, 8.19677734375, 9.361328125, 10.52587890625, 11.6904296875, 12.85498046875, 14.01953125, 15.18408203125, 16.3486328125, 17.51318359375, 18.677734375, 19.84228515625, 21.0068359375, 22.17138671875, 23.3359375, 24.50048828125, 25.6650390625, 26.82958984375, 27.994140625, 29.15869140625, 30.3232421875, 31.48779296875, 32.65234375, 33.81689453125, 34.9814453125, 36.14599609375, 37.310546875, 38.47509765625, 39.6396484375, 40.80419921875, 41.96875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 2.0, 5.0, 11.0, 9.0, 10.0, 18.0, 22.0, 25.0, 26.0, 28.0, 43.0, 47.0, 27.0, 52.0, 35.0, 49.0, 44.0, 51.0, 51.0, 38.0, 32.0, 52.0, 40.0, 39.0, 38.0, 32.0, 19.0, 23.0, 20.0, 34.0, 12.0, 14.0, 14.0, 5.0, 8.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.49072265625, -22.6064453125, -21.72216796875, -20.837890625, -19.95361328125, -19.0693359375, -18.18505859375, -17.30078125, -16.41650390625, -15.5322265625, -14.64794921875, -13.763671875, -12.87939453125, -11.9951171875, -11.11083984375, -10.2265625, -9.34228515625, -8.4580078125, -7.57373046875, -6.689453125, -5.80517578125, -4.9208984375, -4.03662109375, -3.15234375, -2.26806640625, -1.3837890625, -0.49951171875, 0.384765625, 1.26904296875, 2.1533203125, 3.03759765625, 3.921875, 4.80615234375, 5.6904296875, 6.57470703125, 7.458984375, 8.34326171875, 9.2275390625, 10.11181640625, 10.99609375, 11.88037109375, 12.7646484375, 13.64892578125, 14.533203125, 15.41748046875, 16.3017578125, 17.18603515625, 18.0703125, 18.95458984375, 19.8388671875, 20.72314453125, 21.607421875, 22.49169921875, 23.3759765625, 24.26025390625, 25.14453125, 26.02880859375, 26.9130859375, 27.79736328125, 28.681640625, 29.56591796875, 30.4501953125, 31.33447265625, 32.21875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 15.0, 18.0, 12.0, 25.0, 39.0, 65.0, 84.0, 125.0, 159.0, 239.0, 366.0, 577.0, 779.0, 1158.0, 1687.0, 2609.0, 3975.0, 6297.0, 10359.0, 16809.0, 28425.0, 50058.0, 93015.0, 182286.0, 385855.0, 886596.0, 1299613.0, 630591.0, 282965.0, 137642.0, 72103.0, 39403.0, 22726.0, 13624.0, 8399.0, 5280.0, 3483.0, 2263.0, 1458.0, 1006.0, 652.0, 471.0, 317.0, 197.0, 162.0, 101.0, 62.0, 44.0, 27.0, 19.0, 19.0, 14.0, 10.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.25, -36.0966796875, -34.943359375, -33.7900390625, -32.63671875, -31.4833984375, -30.330078125, -29.1767578125, -28.0234375, -26.8701171875, -25.716796875, -24.5634765625, -23.41015625, -22.2568359375, -21.103515625, -19.9501953125, -18.796875, -17.6435546875, -16.490234375, -15.3369140625, -14.18359375, -13.0302734375, -11.876953125, -10.7236328125, -9.5703125, -8.4169921875, -7.263671875, -6.1103515625, -4.95703125, -3.8037109375, -2.650390625, -1.4970703125, -0.34375, 0.8095703125, 1.962890625, 3.1162109375, 4.26953125, 5.4228515625, 6.576171875, 7.7294921875, 8.8828125, 10.0361328125, 11.189453125, 12.3427734375, 13.49609375, 14.6494140625, 15.802734375, 16.9560546875, 18.109375, 19.2626953125, 20.416015625, 21.5693359375, 22.72265625, 23.8759765625, 25.029296875, 26.1826171875, 27.3359375, 28.4892578125, 29.642578125, 30.7958984375, 31.94921875, 33.1025390625, 34.255859375, 35.4091796875, 36.5625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 12.0, 12.0, 14.0, 20.0, 18.0, 26.0, 34.0, 30.0, 38.0, 61.0, 82.0, 105.0, 119.0, 140.0, 189.0, 234.0, 268.0, 330.0, 370.0, 346.0, 281.0, 256.0, 191.0, 164.0, 134.0, 129.0, 88.0, 84.0, 52.0, 44.0, 39.0, 34.0, 28.0, 28.0, 15.0, 13.0, 6.0, 7.0, 5.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.78125, -12.3785400390625, -11.975830078125, -11.5731201171875, -11.17041015625, -10.7677001953125, -10.364990234375, -9.9622802734375, -9.5595703125, -9.1568603515625, -8.754150390625, -8.3514404296875, -7.94873046875, -7.5460205078125, -7.143310546875, -6.7406005859375, -6.337890625, -5.9351806640625, -5.532470703125, -5.1297607421875, -4.72705078125, -4.3243408203125, -3.921630859375, -3.5189208984375, -3.1162109375, -2.7135009765625, -2.310791015625, -1.9080810546875, -1.50537109375, -1.1026611328125, -0.699951171875, -0.2972412109375, 0.10546875, 0.5081787109375, 0.910888671875, 1.3135986328125, 1.71630859375, 2.1190185546875, 2.521728515625, 2.9244384765625, 3.3271484375, 3.7298583984375, 4.132568359375, 4.5352783203125, 4.93798828125, 5.3406982421875, 5.743408203125, 6.1461181640625, 6.548828125, 6.9515380859375, 7.354248046875, 7.7569580078125, 8.15966796875, 8.5623779296875, 8.965087890625, 9.3677978515625, 9.7705078125, 10.1732177734375, 10.575927734375, 10.9786376953125, 11.38134765625, 11.7840576171875, 12.186767578125, 12.5894775390625, 12.9921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 7.0, 6.0, 12.0, 17.0, 15.0, 19.0, 28.0, 37.0, 43.0, 58.0, 71.0, 67.0, 68.0, 61.0, 60.0, 71.0, 71.0, 52.0, 51.0, 33.0, 29.0, 24.0, 21.0, 14.0, 7.0, 12.0, 8.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.9119758605957, -35.81083679199219, -34.709693908691406, -33.60855484008789, -32.507415771484375, -31.406272888183594, -30.305133819580078, -29.20399284362793, -28.10285186767578, -27.001710891723633, -25.900569915771484, -24.79943084716797, -23.69828987121582, -22.597148895263672, -21.496009826660156, -20.394868850708008, -19.29372787475586, -18.19258689880371, -17.091445922851562, -15.990306854248047, -14.889165878295898, -13.78802490234375, -12.686884880065918, -11.585744857788086, -10.484603881835938, -9.383462905883789, -8.282322883605957, -7.181182384490967, -6.080041885375977, -4.978901386260986, -3.877760887145996, -2.776620388031006, -1.6754798889160156, -0.5743393898010254, 0.5268011093139648, 1.627941608428955, 2.7290821075439453, 3.8302226066589355, 4.931363105773926, 6.032503604888916, 7.133644104003906, 8.234785079956055, 9.335925102233887, 10.437065124511719, 11.538206100463867, 12.639347076416016, 13.740487098693848, 14.84162712097168, 15.942768096923828, 17.043909072875977, 18.145050048828125, 19.24618911743164, 20.34733009338379, 21.448471069335938, 22.549610137939453, 23.6507511138916, 24.75189208984375, 25.8530330657959, 26.954174041748047, 28.055313110351562, 29.15645408630371, 30.25759506225586, 31.358734130859375, 32.459877014160156, 33.56101608276367]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 12.0, 9.0, 10.0, 8.0, 18.0, 15.0, 28.0, 21.0, 23.0, 31.0, 32.0, 37.0, 24.0, 32.0, 31.0, 36.0, 45.0, 53.0, 38.0, 37.0, 34.0, 60.0, 27.0, 35.0, 24.0, 29.0, 34.0, 30.0, 20.0, 30.0, 17.0, 25.0, 15.0, 11.0, 10.0, 8.0, 10.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.57047462463379, -25.722055435180664, -24.87363624572754, -24.025217056274414, -23.17679786682129, -22.328378677368164, -21.47995948791504, -20.631540298461914, -19.78312110900879, -18.934701919555664, -18.08628273010254, -17.237863540649414, -16.38944435119629, -15.541025161743164, -14.692605972290039, -13.844186782836914, -12.995767593383789, -12.147348403930664, -11.298929214477539, -10.450510025024414, -9.602090835571289, -8.753671646118164, -7.905252456665039, -7.056833267211914, -6.208414077758789, -5.359994888305664, -4.511575698852539, -3.663156509399414, -2.814737319946289, -1.966318130493164, -1.117898941040039, -0.26947975158691406, 0.5789413452148438, 1.4273605346679688, 2.2757797241210938, 3.1241989135742188, 3.9726181030273438, 4.821037292480469, 5.669456481933594, 6.517875671386719, 7.366294860839844, 8.214714050292969, 9.063133239746094, 9.911552429199219, 10.759971618652344, 11.608390808105469, 12.456809997558594, 13.305229187011719, 14.153648376464844, 15.002067565917969, 15.850486755371094, 16.69890594482422, 17.547325134277344, 18.39574432373047, 19.244163513183594, 20.09258270263672, 20.941001892089844, 21.78942108154297, 22.637840270996094, 23.48625946044922, 24.334678649902344, 25.18309783935547, 26.031517028808594, 26.87993621826172, 27.728355407714844]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 5.0, 15.0, 16.0, 27.0, 44.0, 45.0, 70.0, 96.0, 143.0, 184.0, 309.0, 418.0, 566.0, 819.0, 1226.0, 1890.0, 2784.0, 4068.0, 6376.0, 9887.0, 15692.0, 24234.0, 39118.0, 65207.0, 112547.0, 192558.0, 222163.0, 138914.0, 79704.0, 47739.0, 29465.0, 18334.0, 11453.0, 7454.0, 4921.0, 3231.0, 2199.0, 1477.0, 956.0, 679.0, 451.0, 321.0, 238.0, 153.0, 100.0, 88.0, 51.0, 31.0, 23.0, 26.0, 16.0, 6.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0], "bins": [-18.453125, -17.8798828125, -17.306640625, -16.7333984375, -16.16015625, -15.5869140625, -15.013671875, -14.4404296875, -13.8671875, -13.2939453125, -12.720703125, -12.1474609375, -11.57421875, -11.0009765625, -10.427734375, -9.8544921875, -9.28125, -8.7080078125, -8.134765625, -7.5615234375, -6.98828125, -6.4150390625, -5.841796875, -5.2685546875, -4.6953125, -4.1220703125, -3.548828125, -2.9755859375, -2.40234375, -1.8291015625, -1.255859375, -0.6826171875, -0.109375, 0.4638671875, 1.037109375, 1.6103515625, 2.18359375, 2.7568359375, 3.330078125, 3.9033203125, 4.4765625, 5.0498046875, 5.623046875, 6.1962890625, 6.76953125, 7.3427734375, 7.916015625, 8.4892578125, 9.0625, 9.6357421875, 10.208984375, 10.7822265625, 11.35546875, 11.9287109375, 12.501953125, 13.0751953125, 13.6484375, 14.2216796875, 14.794921875, 15.3681640625, 15.94140625, 16.5146484375, 17.087890625, 17.6611328125, 18.234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 7.0, 13.0, 6.0, 13.0, 21.0, 26.0, 31.0, 33.0, 31.0, 35.0, 31.0, 31.0, 26.0, 30.0, 36.0, 51.0, 46.0, 38.0, 51.0, 42.0, 50.0, 33.0, 33.0, 27.0, 32.0, 22.0, 29.0, 22.0, 19.0, 15.0, 18.0, 15.0, 11.0, 9.0, 5.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-27.8125, -26.935546875, -26.05859375, -25.181640625, -24.3046875, -23.427734375, -22.55078125, -21.673828125, -20.796875, -19.919921875, -19.04296875, -18.166015625, -17.2890625, -16.412109375, -15.53515625, -14.658203125, -13.78125, -12.904296875, -12.02734375, -11.150390625, -10.2734375, -9.396484375, -8.51953125, -7.642578125, -6.765625, -5.888671875, -5.01171875, -4.134765625, -3.2578125, -2.380859375, -1.50390625, -0.626953125, 0.25, 1.126953125, 2.00390625, 2.880859375, 3.7578125, 4.634765625, 5.51171875, 6.388671875, 7.265625, 8.142578125, 9.01953125, 9.896484375, 10.7734375, 11.650390625, 12.52734375, 13.404296875, 14.28125, 15.158203125, 16.03515625, 16.912109375, 17.7890625, 18.666015625, 19.54296875, 20.419921875, 21.296875, 22.173828125, 23.05078125, 23.927734375, 24.8046875, 25.681640625, 26.55859375, 27.435546875, 28.3125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 13.0, 15.0, 22.0, 24.0, 53.0, 60.0, 118.0, 158.0, 220.0, 375.0, 620.0, 899.0, 1390.0, 2304.0, 3907.0, 6554.0, 11660.0, 21292.0, 41404.0, 89085.0, 231667.0, 359984.0, 146292.0, 61939.0, 30226.0, 16078.0, 8808.0, 5171.0, 3117.0, 1833.0, 1200.0, 704.0, 448.0, 321.0, 201.0, 122.0, 77.0, 51.0, 40.0, 27.0, 19.0, 20.0, 14.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0], "bins": [-38.0, -36.952392578125, -35.90478515625, -34.857177734375, -33.8095703125, -32.761962890625, -31.71435546875, -30.666748046875, -29.619140625, -28.571533203125, -27.52392578125, -26.476318359375, -25.4287109375, -24.381103515625, -23.33349609375, -22.285888671875, -21.23828125, -20.190673828125, -19.14306640625, -18.095458984375, -17.0478515625, -16.000244140625, -14.95263671875, -13.905029296875, -12.857421875, -11.809814453125, -10.76220703125, -9.714599609375, -8.6669921875, -7.619384765625, -6.57177734375, -5.524169921875, -4.4765625, -3.428955078125, -2.38134765625, -1.333740234375, -0.2861328125, 0.761474609375, 1.80908203125, 2.856689453125, 3.904296875, 4.951904296875, 5.99951171875, 7.047119140625, 8.0947265625, 9.142333984375, 10.18994140625, 11.237548828125, 12.28515625, 13.332763671875, 14.38037109375, 15.427978515625, 16.4755859375, 17.523193359375, 18.57080078125, 19.618408203125, 20.666015625, 21.713623046875, 22.76123046875, 23.808837890625, 24.8564453125, 25.904052734375, 26.95166015625, 27.999267578125, 29.046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 18.0, 11.0, 19.0, 14.0, 19.0, 26.0, 29.0, 15.0, 30.0, 30.0, 40.0, 41.0, 40.0, 42.0, 38.0, 45.0, 44.0, 35.0, 44.0, 34.0, 30.0, 35.0, 31.0, 33.0, 30.0, 27.0, 26.0, 24.0, 19.0, 13.0, 26.0, 13.0, 9.0, 7.0, 7.0, 7.0, 9.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.28125, -17.7333984375, -17.185546875, -16.6376953125, -16.08984375, -15.5419921875, -14.994140625, -14.4462890625, -13.8984375, -13.3505859375, -12.802734375, -12.2548828125, -11.70703125, -11.1591796875, -10.611328125, -10.0634765625, -9.515625, -8.9677734375, -8.419921875, -7.8720703125, -7.32421875, -6.7763671875, -6.228515625, -5.6806640625, -5.1328125, -4.5849609375, -4.037109375, -3.4892578125, -2.94140625, -2.3935546875, -1.845703125, -1.2978515625, -0.75, -0.2021484375, 0.345703125, 0.8935546875, 1.44140625, 1.9892578125, 2.537109375, 3.0849609375, 3.6328125, 4.1806640625, 4.728515625, 5.2763671875, 5.82421875, 6.3720703125, 6.919921875, 7.4677734375, 8.015625, 8.5634765625, 9.111328125, 9.6591796875, 10.20703125, 10.7548828125, 11.302734375, 11.8505859375, 12.3984375, 12.9462890625, 13.494140625, 14.0419921875, 14.58984375, 15.1376953125, 15.685546875, 16.2333984375, 16.78125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 12.0, 17.0, 14.0, 34.0, 29.0, 69.0, 94.0, 169.0, 303.0, 586.0, 1068.0, 2033.0, 4140.0, 9580.0, 24473.0, 73042.0, 253905.0, 444599.0, 156431.0, 47178.0, 17187.0, 6979.0, 3239.0, 1493.0, 796.0, 451.0, 240.0, 124.0, 88.0, 48.0, 33.0, 32.0, 17.0, 9.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.421875, -10.126708984375, -9.83154296875, -9.536376953125, -9.2412109375, -8.946044921875, -8.65087890625, -8.355712890625, -8.060546875, -7.765380859375, -7.47021484375, -7.175048828125, -6.8798828125, -6.584716796875, -6.28955078125, -5.994384765625, -5.69921875, -5.404052734375, -5.10888671875, -4.813720703125, -4.5185546875, -4.223388671875, -3.92822265625, -3.633056640625, -3.337890625, -3.042724609375, -2.74755859375, -2.452392578125, -2.1572265625, -1.862060546875, -1.56689453125, -1.271728515625, -0.9765625, -0.681396484375, -0.38623046875, -0.091064453125, 0.2041015625, 0.499267578125, 0.79443359375, 1.089599609375, 1.384765625, 1.679931640625, 1.97509765625, 2.270263671875, 2.5654296875, 2.860595703125, 3.15576171875, 3.450927734375, 3.74609375, 4.041259765625, 4.33642578125, 4.631591796875, 4.9267578125, 5.221923828125, 5.51708984375, 5.812255859375, 6.107421875, 6.402587890625, 6.69775390625, 6.992919921875, 7.2880859375, 7.583251953125, 7.87841796875, 8.173583984375, 8.46875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 11.0, 11.0, 17.0, 20.0, 32.0, 43.0, 53.0, 82.0, 77.0, 106.0, 96.0, 87.0, 97.0, 87.0, 42.0, 29.0, 25.0, 19.0, 15.0, 15.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005488395690917969, -0.0005241706967353821, -0.0004995018243789673, -0.0004748329520225525, -0.0004501640796661377, -0.0004254952073097229, -0.0004008263349533081, -0.0003761574625968933, -0.0003514885902404785, -0.0003268197178840637, -0.0003021508455276489, -0.00027748197317123413, -0.00025281310081481934, -0.00022814422845840454, -0.00020347535610198975, -0.00017880648374557495, -0.00015413761138916016, -0.00012946873903274536, -0.00010479986667633057, -8.013099431991577e-05, -5.5462121963500977e-05, -3.079324960708618e-05, -6.124377250671387e-06, 1.8544495105743408e-05, 4.32133674621582e-05, 6.7882239818573e-05, 9.255111217498779e-05, 0.00011721998453140259, 0.00014188885688781738, 0.00016655772924423218, 0.00019122660160064697, 0.00021589547395706177, 0.00024056434631347656, 0.00026523321866989136, 0.00028990209102630615, 0.00031457096338272095, 0.00033923983573913574, 0.00036390870809555054, 0.00038857758045196533, 0.0004132464528083801, 0.0004379153251647949, 0.0004625841975212097, 0.0004872530698776245, 0.0005119219422340393, 0.0005365908145904541, 0.0005612596869468689, 0.0005859285593032837, 0.0006105974316596985, 0.0006352663040161133, 0.0006599351763725281, 0.0006846040487289429, 0.0007092729210853577, 0.0007339417934417725, 0.0007586106657981873, 0.000783279538154602, 0.0008079484105110168, 0.0008326172828674316, 0.0008572861552238464, 0.0008819550275802612, 0.000906623899936676, 0.0009312927722930908, 0.0009559616446495056, 0.0009806305170059204, 0.0010052993893623352, 0.00102996826171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 8.0, 10.0, 17.0, 17.0, 42.0, 32.0, 50.0, 46.0, 96.0, 141.0, 219.0, 256.0, 487.0, 758.0, 1385.0, 2547.0, 5326.0, 11856.0, 28825.0, 76813.0, 216077.0, 383154.0, 199802.0, 71561.0, 26952.0, 11196.0, 5057.0, 2501.0, 1269.0, 695.0, 453.0, 247.0, 173.0, 141.0, 102.0, 57.0, 41.0, 41.0, 19.0, 22.0, 14.0, 5.0, 10.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-11.6484375, -11.3104248046875, -10.972412109375, -10.6343994140625, -10.29638671875, -9.9583740234375, -9.620361328125, -9.2823486328125, -8.9443359375, -8.6063232421875, -8.268310546875, -7.9302978515625, -7.59228515625, -7.2542724609375, -6.916259765625, -6.5782470703125, -6.240234375, -5.9022216796875, -5.564208984375, -5.2261962890625, -4.88818359375, -4.5501708984375, -4.212158203125, -3.8741455078125, -3.5361328125, -3.1981201171875, -2.860107421875, -2.5220947265625, -2.18408203125, -1.8460693359375, -1.508056640625, -1.1700439453125, -0.83203125, -0.4940185546875, -0.156005859375, 0.1820068359375, 0.52001953125, 0.8580322265625, 1.196044921875, 1.5340576171875, 1.8720703125, 2.2100830078125, 2.548095703125, 2.8861083984375, 3.22412109375, 3.5621337890625, 3.900146484375, 4.2381591796875, 4.576171875, 4.9141845703125, 5.252197265625, 5.5902099609375, 5.92822265625, 6.2662353515625, 6.604248046875, 6.9422607421875, 7.2802734375, 7.6182861328125, 7.956298828125, 8.2943115234375, 8.63232421875, 8.9703369140625, 9.308349609375, 9.6463623046875, 9.984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 0.0, 8.0, 6.0, 8.0, 11.0, 10.0, 14.0, 15.0, 29.0, 23.0, 45.0, 44.0, 60.0, 77.0, 71.0, 92.0, 101.0, 71.0, 67.0, 53.0, 36.0, 32.0, 29.0, 21.0, 19.0, 16.0, 11.0, 12.0, 7.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.2362060546875, -2.156005859375, -2.0758056640625, -1.99560546875, -1.9154052734375, -1.835205078125, -1.7550048828125, -1.6748046875, -1.5946044921875, -1.514404296875, -1.4342041015625, -1.35400390625, -1.2738037109375, -1.193603515625, -1.1134033203125, -1.033203125, -0.9530029296875, -0.872802734375, -0.7926025390625, -0.71240234375, -0.6322021484375, -0.552001953125, -0.4718017578125, -0.3916015625, -0.3114013671875, -0.231201171875, -0.1510009765625, -0.07080078125, 0.0093994140625, 0.089599609375, 0.1697998046875, 0.25, 0.3302001953125, 0.410400390625, 0.4906005859375, 0.57080078125, 0.6510009765625, 0.731201171875, 0.8114013671875, 0.8916015625, 0.9718017578125, 1.052001953125, 1.1322021484375, 1.21240234375, 1.2926025390625, 1.372802734375, 1.4530029296875, 1.533203125, 1.6134033203125, 1.693603515625, 1.7738037109375, 1.85400390625, 1.9342041015625, 2.014404296875, 2.0946044921875, 2.1748046875, 2.2550048828125, 2.335205078125, 2.4154052734375, 2.49560546875, 2.5758056640625, 2.656005859375, 2.7362060546875, 2.81640625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 8.0, 7.0, 17.0, 14.0, 13.0, 25.0, 32.0, 44.0, 44.0, 53.0, 69.0, 70.0, 64.0, 66.0, 56.0, 57.0, 79.0, 63.0, 35.0, 37.0, 31.0, 20.0, 20.0, 15.0, 9.0, 8.0, 10.0, 4.0, 1.0, 7.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.088653564453125, -34.002357482910156, -32.91605758666992, -31.829761505126953, -30.74346351623535, -29.65716552734375, -28.57086944580078, -27.48457145690918, -26.398273468017578, -25.311975479125977, -24.225677490234375, -23.139381408691406, -22.053083419799805, -20.966785430908203, -19.880489349365234, -18.794191360473633, -17.70789337158203, -16.62159538269043, -15.535298347473145, -14.44900131225586, -13.362703323364258, -12.276405334472656, -11.190108299255371, -10.103811264038086, -9.017513275146484, -7.931215763092041, -6.844918251037598, -5.758620738983154, -4.672323226928711, -3.5860257148742676, -2.499728202819824, -1.4134306907653809, -0.3271331787109375, 0.7591643333435059, 1.8454618453979492, 2.9317593574523926, 4.018056869506836, 5.104354381561279, 6.190651893615723, 7.276949405670166, 8.36324691772461, 9.449544906616211, 10.535841941833496, 11.622138977050781, 12.708436965942383, 13.794734954833984, 14.88103199005127, 15.967329025268555, 17.053627014160156, 18.139925003051758, 19.22622299194336, 20.312519073486328, 21.39881706237793, 22.48511505126953, 23.5714111328125, 24.6577091217041, 25.744007110595703, 26.830305099487305, 27.916603088378906, 29.002899169921875, 30.089197158813477, 31.175495147705078, 32.26179122924805, 33.34809112548828, 34.43438720703125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 10.0, 10.0, 10.0, 16.0, 16.0, 25.0, 18.0, 33.0, 36.0, 31.0, 28.0, 28.0, 29.0, 35.0, 38.0, 41.0, 47.0, 41.0, 38.0, 39.0, 47.0, 40.0, 30.0, 29.0, 24.0, 35.0, 27.0, 25.0, 22.0, 27.0, 17.0, 17.0, 12.0, 7.0, 12.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.153217315673828, -25.315322875976562, -24.477428436279297, -23.639535903930664, -22.8016414642334, -21.963747024536133, -21.1258544921875, -20.287960052490234, -19.45006561279297, -18.612171173095703, -17.774276733398438, -16.936384201049805, -16.09848976135254, -15.260595321655273, -14.422701835632324, -13.584808349609375, -12.74691390991211, -11.909019470214844, -11.071125984191895, -10.233232498168945, -9.39533805847168, -8.557443618774414, -7.719550132751465, -6.881656169891357, -6.04376220703125, -5.205868244171143, -4.367974281311035, -3.5300803184509277, -2.6921863555908203, -1.854292392730713, -1.0163984298706055, -0.17850446701049805, 0.6593914031982422, 1.4972853660583496, 2.335179328918457, 3.1730732917785645, 4.010967254638672, 4.848861217498779, 5.686755180358887, 6.524649143218994, 7.362543106079102, 8.200437545776367, 9.038331031799316, 9.876224517822266, 10.714118957519531, 11.552013397216797, 12.389906883239746, 13.227800369262695, 14.065694808959961, 14.903589248657227, 15.741482734680176, 16.579376220703125, 17.41727066040039, 18.255165100097656, 19.093059539794922, 19.930952072143555, 20.76884651184082, 21.606740951538086, 22.44463348388672, 23.282527923583984, 24.12042236328125, 24.958316802978516, 25.79621124267578, 26.634103775024414, 27.47199821472168]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 6.0, 11.0, 10.0, 30.0, 42.0, 66.0, 77.0, 115.0, 167.0, 243.0, 438.0, 580.0, 929.0, 1464.0, 2248.0, 3696.0, 5803.0, 9707.0, 16143.0, 28077.0, 49471.0, 89902.0, 163310.0, 240956.0, 189486.0, 106744.0, 58149.0, 32629.0, 18789.0, 10990.0, 6740.0, 4184.0, 2607.0, 1676.0, 1039.0, 693.0, 430.0, 300.0, 199.0, 150.0, 75.0, 62.0, 36.0, 20.0, 19.0, 12.0, 12.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.9375, -35.73193359375, -34.5263671875, -33.32080078125, -32.115234375, -30.90966796875, -29.7041015625, -28.49853515625, -27.29296875, -26.08740234375, -24.8818359375, -23.67626953125, -22.470703125, -21.26513671875, -20.0595703125, -18.85400390625, -17.6484375, -16.44287109375, -15.2373046875, -14.03173828125, -12.826171875, -11.62060546875, -10.4150390625, -9.20947265625, -8.00390625, -6.79833984375, -5.5927734375, -4.38720703125, -3.181640625, -1.97607421875, -0.7705078125, 0.43505859375, 1.640625, 2.84619140625, 4.0517578125, 5.25732421875, 6.462890625, 7.66845703125, 8.8740234375, 10.07958984375, 11.28515625, 12.49072265625, 13.6962890625, 14.90185546875, 16.107421875, 17.31298828125, 18.5185546875, 19.72412109375, 20.9296875, 22.13525390625, 23.3408203125, 24.54638671875, 25.751953125, 26.95751953125, 28.1630859375, 29.36865234375, 30.57421875, 31.77978515625, 32.9853515625, 34.19091796875, 35.396484375, 36.60205078125, 37.8076171875, 39.01318359375, 40.21875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 14.0, 12.0, 9.0, 10.0, 13.0, 12.0, 19.0, 20.0, 35.0, 35.0, 36.0, 35.0, 29.0, 33.0, 26.0, 41.0, 51.0, 44.0, 48.0, 48.0, 43.0, 30.0, 52.0, 38.0, 24.0, 32.0, 26.0, 27.0, 22.0, 19.0, 27.0, 16.0, 19.0, 14.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.515625, -26.6328125, -25.75, -24.8671875, -23.984375, -23.1015625, -22.21875, -21.3359375, -20.453125, -19.5703125, -18.6875, -17.8046875, -16.921875, -16.0390625, -15.15625, -14.2734375, -13.390625, -12.5078125, -11.625, -10.7421875, -9.859375, -8.9765625, -8.09375, -7.2109375, -6.328125, -5.4453125, -4.5625, -3.6796875, -2.796875, -1.9140625, -1.03125, -0.1484375, 0.734375, 1.6171875, 2.5, 3.3828125, 4.265625, 5.1484375, 6.03125, 6.9140625, 7.796875, 8.6796875, 9.5625, 10.4453125, 11.328125, 12.2109375, 13.09375, 13.9765625, 14.859375, 15.7421875, 16.625, 17.5078125, 18.390625, 19.2734375, 20.15625, 21.0390625, 21.921875, 22.8046875, 23.6875, 24.5703125, 25.453125, 26.3359375, 27.21875, 28.1015625, 28.984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 9.0, 19.0, 30.0, 45.0, 50.0, 80.0, 100.0, 136.0, 198.0, 285.0, 390.0, 628.0, 905.0, 1238.0, 1957.0, 2678.0, 3993.0, 5928.0, 9163.0, 14176.0, 22019.0, 33987.0, 54456.0, 86907.0, 132918.0, 177215.0, 168148.0, 119601.0, 76215.0, 48193.0, 30421.0, 19134.0, 12442.0, 8096.0, 5322.0, 3658.0, 2421.0, 1627.0, 1078.0, 852.0, 543.0, 395.0, 272.0, 189.0, 125.0, 85.0, 65.0, 52.0, 26.0, 31.0, 11.0, 14.0, 8.0, 11.0, 3.0, 1.0, 2.0, 3.0], "bins": [-32.53125, -31.51025390625, -30.4892578125, -29.46826171875, -28.447265625, -27.42626953125, -26.4052734375, -25.38427734375, -24.36328125, -23.34228515625, -22.3212890625, -21.30029296875, -20.279296875, -19.25830078125, -18.2373046875, -17.21630859375, -16.1953125, -15.17431640625, -14.1533203125, -13.13232421875, -12.111328125, -11.09033203125, -10.0693359375, -9.04833984375, -8.02734375, -7.00634765625, -5.9853515625, -4.96435546875, -3.943359375, -2.92236328125, -1.9013671875, -0.88037109375, 0.140625, 1.16162109375, 2.1826171875, 3.20361328125, 4.224609375, 5.24560546875, 6.2666015625, 7.28759765625, 8.30859375, 9.32958984375, 10.3505859375, 11.37158203125, 12.392578125, 13.41357421875, 14.4345703125, 15.45556640625, 16.4765625, 17.49755859375, 18.5185546875, 19.53955078125, 20.560546875, 21.58154296875, 22.6025390625, 23.62353515625, 24.64453125, 25.66552734375, 26.6865234375, 27.70751953125, 28.728515625, 29.74951171875, 30.7705078125, 31.79150390625, 32.8125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 12.0, 8.0, 10.0, 19.0, 15.0, 16.0, 22.0, 23.0, 29.0, 35.0, 41.0, 42.0, 44.0, 29.0, 40.0, 57.0, 49.0, 35.0, 46.0, 50.0, 51.0, 44.0, 34.0, 32.0, 36.0, 29.0, 28.0, 18.0, 20.0, 13.0, 10.0, 11.0, 12.0, 8.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.84375, -21.2021484375, -20.560546875, -19.9189453125, -19.27734375, -18.6357421875, -17.994140625, -17.3525390625, -16.7109375, -16.0693359375, -15.427734375, -14.7861328125, -14.14453125, -13.5029296875, -12.861328125, -12.2197265625, -11.578125, -10.9365234375, -10.294921875, -9.6533203125, -9.01171875, -8.3701171875, -7.728515625, -7.0869140625, -6.4453125, -5.8037109375, -5.162109375, -4.5205078125, -3.87890625, -3.2373046875, -2.595703125, -1.9541015625, -1.3125, -0.6708984375, -0.029296875, 0.6123046875, 1.25390625, 1.8955078125, 2.537109375, 3.1787109375, 3.8203125, 4.4619140625, 5.103515625, 5.7451171875, 6.38671875, 7.0283203125, 7.669921875, 8.3115234375, 8.953125, 9.5947265625, 10.236328125, 10.8779296875, 11.51953125, 12.1611328125, 12.802734375, 13.4443359375, 14.0859375, 14.7275390625, 15.369140625, 16.0107421875, 16.65234375, 17.2939453125, 17.935546875, 18.5771484375, 19.21875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 7.0, 4.0, 7.0, 8.0, 17.0, 18.0, 23.0, 57.0, 68.0, 127.0, 163.0, 285.0, 440.0, 856.0, 1379.0, 2435.0, 4581.0, 9096.0, 18975.0, 42703.0, 102665.0, 258287.0, 340391.0, 151950.0, 61396.0, 26562.0, 12362.0, 6187.0, 3248.0, 1709.0, 991.0, 584.0, 350.0, 206.0, 124.0, 95.0, 68.0, 50.0, 23.0, 18.0, 13.0, 14.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.21875, -17.61572265625, -17.0126953125, -16.40966796875, -15.806640625, -15.20361328125, -14.6005859375, -13.99755859375, -13.39453125, -12.79150390625, -12.1884765625, -11.58544921875, -10.982421875, -10.37939453125, -9.7763671875, -9.17333984375, -8.5703125, -7.96728515625, -7.3642578125, -6.76123046875, -6.158203125, -5.55517578125, -4.9521484375, -4.34912109375, -3.74609375, -3.14306640625, -2.5400390625, -1.93701171875, -1.333984375, -0.73095703125, -0.1279296875, 0.47509765625, 1.078125, 1.68115234375, 2.2841796875, 2.88720703125, 3.490234375, 4.09326171875, 4.6962890625, 5.29931640625, 5.90234375, 6.50537109375, 7.1083984375, 7.71142578125, 8.314453125, 8.91748046875, 9.5205078125, 10.12353515625, 10.7265625, 11.32958984375, 11.9326171875, 12.53564453125, 13.138671875, 13.74169921875, 14.3447265625, 14.94775390625, 15.55078125, 16.15380859375, 16.7568359375, 17.35986328125, 17.962890625, 18.56591796875, 19.1689453125, 19.77197265625, 20.375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 8.0, 5.0, 16.0, 25.0, 60.0, 74.0, 114.0, 131.0, 164.0, 143.0, 92.0, 66.0, 41.0, 16.0, 19.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036602020263671875, -0.0035697519779205322, -0.003479301929473877, -0.0033888518810272217, -0.0032984018325805664, -0.003207951784133911, -0.003117501735687256, -0.0030270516872406006, -0.0029366016387939453, -0.00284615159034729, -0.0027557015419006348, -0.0026652514934539795, -0.0025748014450073242, -0.002484351396560669, -0.0023939013481140137, -0.0023034512996673584, -0.002213001251220703, -0.002122551202774048, -0.0020321011543273926, -0.0019416511058807373, -0.001851201057434082, -0.0017607510089874268, -0.0016703009605407715, -0.0015798509120941162, -0.001489400863647461, -0.0013989508152008057, -0.0013085007667541504, -0.0012180507183074951, -0.0011276006698608398, -0.0010371506214141846, -0.0009467005729675293, -0.000856250524520874, -0.0007658004760742188, -0.0006753504276275635, -0.0005849003791809082, -0.0004944503307342529, -0.00040400028228759766, -0.0003135502338409424, -0.0002231001853942871, -0.00013265013694763184, -4.220008850097656e-05, 4.824995994567871e-05, 0.00013870000839233398, 0.00022915005683898926, 0.00031960010528564453, 0.0004100501537322998, 0.0005005002021789551, 0.0005909502506256104, 0.0006814002990722656, 0.0007718503475189209, 0.0008623003959655762, 0.0009527504444122314, 0.0010432004928588867, 0.001133650541305542, 0.0012241005897521973, 0.0013145506381988525, 0.0014050006866455078, 0.001495450735092163, 0.0015859007835388184, 0.0016763508319854736, 0.001766800880432129, 0.0018572509288787842, 0.0019477009773254395, 0.0020381510257720947, 0.00212860107421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 8.0, 3.0, 6.0, 9.0, 14.0, 13.0, 32.0, 28.0, 41.0, 50.0, 66.0, 105.0, 143.0, 221.0, 266.0, 409.0, 664.0, 898.0, 1542.0, 2628.0, 4467.0, 7893.0, 14613.0, 29231.0, 61383.0, 134249.0, 265373.0, 264964.0, 134512.0, 61556.0, 28974.0, 14741.0, 7833.0, 4357.0, 2545.0, 1601.0, 1011.0, 685.0, 415.0, 292.0, 205.0, 140.0, 94.0, 72.0, 53.0, 43.0, 33.0, 24.0, 7.0, 13.0, 12.0, 10.0, 5.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.484375, -16.93798828125, -16.3916015625, -15.84521484375, -15.298828125, -14.75244140625, -14.2060546875, -13.65966796875, -13.11328125, -12.56689453125, -12.0205078125, -11.47412109375, -10.927734375, -10.38134765625, -9.8349609375, -9.28857421875, -8.7421875, -8.19580078125, -7.6494140625, -7.10302734375, -6.556640625, -6.01025390625, -5.4638671875, -4.91748046875, -4.37109375, -3.82470703125, -3.2783203125, -2.73193359375, -2.185546875, -1.63916015625, -1.0927734375, -0.54638671875, 0.0, 0.54638671875, 1.0927734375, 1.63916015625, 2.185546875, 2.73193359375, 3.2783203125, 3.82470703125, 4.37109375, 4.91748046875, 5.4638671875, 6.01025390625, 6.556640625, 7.10302734375, 7.6494140625, 8.19580078125, 8.7421875, 9.28857421875, 9.8349609375, 10.38134765625, 10.927734375, 11.47412109375, 12.0205078125, 12.56689453125, 13.11328125, 13.65966796875, 14.2060546875, 14.75244140625, 15.298828125, 15.84521484375, 16.3916015625, 16.93798828125, 17.484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 10.0, 8.0, 9.0, 9.0, 17.0, 23.0, 28.0, 40.0, 55.0, 64.0, 68.0, 92.0, 85.0, 91.0, 100.0, 67.0, 47.0, 46.0, 34.0, 16.0, 20.0, 12.0, 20.0, 10.0, 7.0, 8.0, 2.0, 9.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.54296875, -6.33160400390625, -6.1202392578125, -5.90887451171875, -5.697509765625, -5.48614501953125, -5.2747802734375, -5.06341552734375, -4.85205078125, -4.64068603515625, -4.4293212890625, -4.21795654296875, -4.006591796875, -3.79522705078125, -3.5838623046875, -3.37249755859375, -3.1611328125, -2.94976806640625, -2.7384033203125, -2.52703857421875, -2.315673828125, -2.10430908203125, -1.8929443359375, -1.68157958984375, -1.47021484375, -1.25885009765625, -1.0474853515625, -0.83612060546875, -0.624755859375, -0.41339111328125, -0.2020263671875, 0.00933837890625, 0.220703125, 0.43206787109375, 0.6434326171875, 0.85479736328125, 1.066162109375, 1.27752685546875, 1.4888916015625, 1.70025634765625, 1.91162109375, 2.12298583984375, 2.3343505859375, 2.54571533203125, 2.757080078125, 2.96844482421875, 3.1798095703125, 3.39117431640625, 3.6025390625, 3.81390380859375, 4.0252685546875, 4.23663330078125, 4.447998046875, 4.65936279296875, 4.8707275390625, 5.08209228515625, 5.29345703125, 5.50482177734375, 5.7161865234375, 5.92755126953125, 6.138916015625, 6.35028076171875, 6.5616455078125, 6.77301025390625, 6.984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 2.0, 13.0, 9.0, 14.0, 18.0, 29.0, 26.0, 28.0, 38.0, 41.0, 55.0, 38.0, 60.0, 51.0, 69.0, 65.0, 53.0, 62.0, 50.0, 46.0, 40.0, 31.0, 29.0, 24.0, 17.0, 12.0, 17.0, 8.0, 11.0, 3.0, 3.0, 9.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.605167388916016, -27.641395568847656, -26.67762565612793, -25.71385383605957, -24.75008201599121, -23.786312103271484, -22.822540283203125, -21.858768463134766, -20.894996643066406, -19.931224822998047, -18.96745491027832, -18.00368309020996, -17.0399112701416, -16.076141357421875, -15.112369537353516, -14.148597717285156, -13.18482780456543, -12.221056938171387, -11.257285118103027, -10.293514251708984, -9.329742431640625, -8.365971565246582, -7.402200698852539, -6.438429355621338, -5.474658012390137, -4.5108866691589355, -3.5471155643463135, -2.5833444595336914, -1.6195731163024902, -0.6558017730712891, 0.3079690933227539, 1.271740436553955, 2.2355117797851562, 3.1992831230163574, 4.163054466247559, 5.126825332641602, 6.090596675872803, 7.054368019104004, 8.018138885498047, 8.981910705566406, 9.94568157196045, 10.909452438354492, 11.873224258422852, 12.836995124816895, 13.800765991210938, 14.764537811279297, 15.72830867767334, 16.692079544067383, 17.655851364135742, 18.6196231842041, 19.583393096923828, 20.547164916992188, 21.510936737060547, 22.474708557128906, 23.438478469848633, 24.402250289916992, 25.36602020263672, 26.329792022705078, 27.293561935424805, 28.257333755493164, 29.221105575561523, 30.18487548828125, 31.14864730834961, 32.11241912841797, 33.07619094848633]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 9.0, 22.0, 10.0, 17.0, 20.0, 22.0, 35.0, 29.0, 38.0, 34.0, 41.0, 47.0, 31.0, 46.0, 34.0, 47.0, 44.0, 38.0, 49.0, 43.0, 36.0, 33.0, 35.0, 36.0, 37.0, 16.0, 28.0, 20.0, 21.0, 16.0, 8.0, 5.0, 7.0, 2.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.032825469970703, -26.050125122070312, -25.06742286682129, -24.0847225189209, -23.102020263671875, -22.119319915771484, -21.136619567871094, -20.15391731262207, -19.17121696472168, -18.18851661682129, -17.205814361572266, -16.223114013671875, -15.240412712097168, -14.257711410522461, -13.275010108947754, -12.292308807373047, -11.30960750579834, -10.326906204223633, -9.344204902648926, -8.361503601074219, -7.378803253173828, -6.396101951599121, -5.413400650024414, -4.430699825286865, -3.447998523712158, -2.4652974605560303, -1.4825962781906128, -0.4998950958251953, 0.4828059673309326, 1.4655070304870605, 2.4482083320617676, 3.4309091567993164, 4.413610458374023, 5.3963117599487305, 6.379012584686279, 7.361713886260986, 8.344414710998535, 9.327116012573242, 10.30981731414795, 11.292518615722656, 12.275218963623047, 13.257920265197754, 14.240621566772461, 15.223321914672852, 16.206024169921875, 17.188724517822266, 18.171424865722656, 19.15412712097168, 20.136829376220703, 21.119529724121094, 22.102231979370117, 23.084932327270508, 24.06763458251953, 25.050334930419922, 26.033035278320312, 27.015737533569336, 27.998437881469727, 28.981138229370117, 29.96384048461914, 30.94654083251953, 31.929243087768555, 32.91194152832031, 33.89464569091797, 34.87734603881836, 35.86004638671875]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 7.0, 3.0, 14.0, 20.0, 24.0, 55.0, 79.0, 131.0, 167.0, 234.0, 297.0, 439.0, 567.0, 876.0, 1287.0, 1775.0, 2838.0, 4263.0, 6501.0, 10682.0, 17277.0, 29531.0, 53876.0, 107253.0, 249101.0, 647771.0, 1288494.0, 1009853.0, 419475.0, 167094.0, 75940.0, 39902.0, 22446.0, 13199.0, 8167.0, 4925.0, 3263.0, 2065.0, 1430.0, 923.0, 641.0, 424.0, 297.0, 176.0, 131.0, 111.0, 76.0, 45.0, 48.0, 36.0, 23.0, 11.0, 9.0, 7.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-32.6875, -31.58935546875, -30.4912109375, -29.39306640625, -28.294921875, -27.19677734375, -26.0986328125, -25.00048828125, -23.90234375, -22.80419921875, -21.7060546875, -20.60791015625, -19.509765625, -18.41162109375, -17.3134765625, -16.21533203125, -15.1171875, -14.01904296875, -12.9208984375, -11.82275390625, -10.724609375, -9.62646484375, -8.5283203125, -7.43017578125, -6.33203125, -5.23388671875, -4.1357421875, -3.03759765625, -1.939453125, -0.84130859375, 0.2568359375, 1.35498046875, 2.453125, 3.55126953125, 4.6494140625, 5.74755859375, 6.845703125, 7.94384765625, 9.0419921875, 10.14013671875, 11.23828125, 12.33642578125, 13.4345703125, 14.53271484375, 15.630859375, 16.72900390625, 17.8271484375, 18.92529296875, 20.0234375, 21.12158203125, 22.2197265625, 23.31787109375, 24.416015625, 25.51416015625, 26.6123046875, 27.71044921875, 28.80859375, 29.90673828125, 31.0048828125, 32.10302734375, 33.201171875, 34.29931640625, 35.3974609375, 36.49560546875, 37.59375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 4.0, 6.0, 9.0, 12.0, 10.0, 21.0, 21.0, 22.0, 27.0, 31.0, 28.0, 36.0, 29.0, 31.0, 31.0, 45.0, 42.0, 37.0, 49.0, 53.0, 44.0, 45.0, 38.0, 36.0, 40.0, 27.0, 27.0, 38.0, 24.0, 20.0, 20.0, 18.0, 15.0, 12.0, 11.0, 5.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.140625, -22.302490234375, -21.46435546875, -20.626220703125, -19.7880859375, -18.949951171875, -18.11181640625, -17.273681640625, -16.435546875, -15.597412109375, -14.75927734375, -13.921142578125, -13.0830078125, -12.244873046875, -11.40673828125, -10.568603515625, -9.73046875, -8.892333984375, -8.05419921875, -7.216064453125, -6.3779296875, -5.539794921875, -4.70166015625, -3.863525390625, -3.025390625, -2.187255859375, -1.34912109375, -0.510986328125, 0.3271484375, 1.165283203125, 2.00341796875, 2.841552734375, 3.6796875, 4.517822265625, 5.35595703125, 6.194091796875, 7.0322265625, 7.870361328125, 8.70849609375, 9.546630859375, 10.384765625, 11.222900390625, 12.06103515625, 12.899169921875, 13.7373046875, 14.575439453125, 15.41357421875, 16.251708984375, 17.08984375, 17.927978515625, 18.76611328125, 19.604248046875, 20.4423828125, 21.280517578125, 22.11865234375, 22.956787109375, 23.794921875, 24.633056640625, 25.47119140625, 26.309326171875, 27.1474609375, 27.985595703125, 28.82373046875, 29.661865234375, 30.5]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 13.0, 19.0, 24.0, 42.0, 40.0, 76.0, 111.0, 176.0, 274.0, 433.0, 708.0, 1240.0, 2214.0, 4057.0, 7333.0, 14404.0, 28458.0, 60369.0, 136011.0, 341527.0, 971845.0, 1569859.0, 634232.0, 233085.0, 97480.0, 44507.0, 21347.0, 11012.0, 5792.0, 3156.0, 1812.0, 1018.0, 575.0, 366.0, 210.0, 152.0, 85.0, 70.0, 49.0, 28.0, 17.0, 17.0, 12.0, 8.0, 2.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-50.40625, -48.845703125, -47.28515625, -45.724609375, -44.1640625, -42.603515625, -41.04296875, -39.482421875, -37.921875, -36.361328125, -34.80078125, -33.240234375, -31.6796875, -30.119140625, -28.55859375, -26.998046875, -25.4375, -23.876953125, -22.31640625, -20.755859375, -19.1953125, -17.634765625, -16.07421875, -14.513671875, -12.953125, -11.392578125, -9.83203125, -8.271484375, -6.7109375, -5.150390625, -3.58984375, -2.029296875, -0.46875, 1.091796875, 2.65234375, 4.212890625, 5.7734375, 7.333984375, 8.89453125, 10.455078125, 12.015625, 13.576171875, 15.13671875, 16.697265625, 18.2578125, 19.818359375, 21.37890625, 22.939453125, 24.5, 26.060546875, 27.62109375, 29.181640625, 30.7421875, 32.302734375, 33.86328125, 35.423828125, 36.984375, 38.544921875, 40.10546875, 41.666015625, 43.2265625, 44.787109375, 46.34765625, 47.908203125, 49.46875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 1.0, 2.0, 4.0, 8.0, 8.0, 16.0, 16.0, 16.0, 34.0, 39.0, 48.0, 68.0, 98.0, 106.0, 149.0, 178.0, 220.0, 296.0, 353.0, 381.0, 383.0, 309.0, 315.0, 240.0, 172.0, 138.0, 104.0, 97.0, 58.0, 57.0, 39.0, 27.0, 22.0, 22.0, 15.0, 16.0, 4.0, 12.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.546875, -13.066650390625, -12.58642578125, -12.106201171875, -11.6259765625, -11.145751953125, -10.66552734375, -10.185302734375, -9.705078125, -9.224853515625, -8.74462890625, -8.264404296875, -7.7841796875, -7.303955078125, -6.82373046875, -6.343505859375, -5.86328125, -5.383056640625, -4.90283203125, -4.422607421875, -3.9423828125, -3.462158203125, -2.98193359375, -2.501708984375, -2.021484375, -1.541259765625, -1.06103515625, -0.580810546875, -0.1005859375, 0.379638671875, 0.85986328125, 1.340087890625, 1.8203125, 2.300537109375, 2.78076171875, 3.260986328125, 3.7412109375, 4.221435546875, 4.70166015625, 5.181884765625, 5.662109375, 6.142333984375, 6.62255859375, 7.102783203125, 7.5830078125, 8.063232421875, 8.54345703125, 9.023681640625, 9.50390625, 9.984130859375, 10.46435546875, 10.944580078125, 11.4248046875, 11.905029296875, 12.38525390625, 12.865478515625, 13.345703125, 13.825927734375, 14.30615234375, 14.786376953125, 15.2666015625, 15.746826171875, 16.22705078125, 16.707275390625, 17.1875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 8.0, 8.0, 15.0, 16.0, 19.0, 18.0, 25.0, 45.0, 37.0, 47.0, 47.0, 55.0, 66.0, 66.0, 72.0, 74.0, 57.0, 52.0, 55.0, 34.0, 33.0, 31.0, 19.0, 13.0, 14.0, 14.0, 13.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.146879196166992, -28.024721145629883, -26.902563095092773, -25.78040313720703, -24.658245086669922, -23.536087036132812, -22.413928985595703, -21.291770935058594, -20.169612884521484, -19.047454833984375, -17.925296783447266, -16.803138732910156, -15.680978775024414, -14.558820724487305, -13.436662673950195, -12.314504623413086, -11.192344665527344, -10.070186614990234, -8.948027610778809, -7.825869560241699, -6.703711032867432, -5.581552505493164, -4.459394454956055, -3.337235927581787, -2.2150774002075195, -1.0929189920425415, 0.029239416122436523, 1.151397705078125, 2.2735562324523926, 3.39571475982666, 4.5178728103637695, 5.640031337738037, 6.762187957763672, 7.8843464851379395, 9.006505012512207, 10.128663063049316, 11.250822067260742, 12.372980117797852, 13.495138168334961, 14.61729621887207, 15.739455223083496, 16.861614227294922, 17.98377227783203, 19.10593032836914, 20.22808837890625, 21.35024642944336, 22.47240447998047, 23.59456443786621, 24.71672248840332, 25.83888053894043, 26.96103858947754, 28.08319854736328, 29.20535659790039, 30.3275146484375, 31.44967269897461, 32.57183074951172, 33.69398880004883, 34.81614685058594, 35.93830490112305, 37.060462951660156, 38.182621002197266, 39.304779052734375, 40.42694091796875, 41.54909896850586, 42.67125701904297]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 4.0, 7.0, 5.0, 7.0, 11.0, 10.0, 11.0, 8.0, 23.0, 25.0, 18.0, 34.0, 33.0, 18.0, 30.0, 41.0, 42.0, 46.0, 40.0, 26.0, 41.0, 38.0, 40.0, 44.0, 40.0, 47.0, 50.0, 28.0, 35.0, 39.0, 23.0, 16.0, 16.0, 26.0, 18.0, 18.0, 6.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.92987823486328, -26.966094970703125, -26.00231170654297, -25.03852653503418, -24.074743270874023, -23.110960006713867, -22.14717674255371, -21.183391571044922, -20.219608306884766, -19.25582504272461, -18.292041778564453, -17.328256607055664, -16.364473342895508, -15.400690078735352, -14.436906814575195, -13.473122596740723, -12.509339332580566, -11.54555606842041, -10.581771850585938, -9.617988586425781, -8.654204368591309, -7.690421104431152, -6.726637363433838, -5.762853622436523, -4.799069881439209, -3.8352861404418945, -2.87150239944458, -1.9077188968658447, -0.9439351558685303, 0.019848346710205078, 0.9836320877075195, 1.947415828704834, 2.9111995697021484, 3.874983310699463, 4.838767051696777, 5.802550315856934, 6.766334533691406, 7.7301177978515625, 8.693901062011719, 9.657685279846191, 10.621469497680664, 11.58525276184082, 12.549036979675293, 13.51282024383545, 14.476604461669922, 15.440387725830078, 16.404170989990234, 17.36795425415039, 18.331737518310547, 19.295520782470703, 20.25930404663086, 21.22308921813965, 22.186872482299805, 23.15065574645996, 24.114439010620117, 25.078224182128906, 26.042007446289062, 27.00579071044922, 27.969573974609375, 28.933359146118164, 29.89714241027832, 30.860925674438477, 31.824708938598633, 32.78849411010742, 33.75227737426758]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 6.0, 11.0, 20.0, 33.0, 37.0, 48.0, 70.0, 133.0, 171.0, 260.0, 360.0, 653.0, 899.0, 1351.0, 2044.0, 3177.0, 5166.0, 8392.0, 13912.0, 23654.0, 43074.0, 80186.0, 161704.0, 274271.0, 202797.0, 101878.0, 52046.0, 28734.0, 16783.0, 9815.0, 6058.0, 3768.0, 2376.0, 1610.0, 1025.0, 642.0, 473.0, 293.0, 188.0, 129.0, 79.0, 69.0, 48.0, 33.0, 23.0, 16.0, 12.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0], "bins": [-23.453125, -22.776611328125, -22.10009765625, -21.423583984375, -20.7470703125, -20.070556640625, -19.39404296875, -18.717529296875, -18.041015625, -17.364501953125, -16.68798828125, -16.011474609375, -15.3349609375, -14.658447265625, -13.98193359375, -13.305419921875, -12.62890625, -11.952392578125, -11.27587890625, -10.599365234375, -9.9228515625, -9.246337890625, -8.56982421875, -7.893310546875, -7.216796875, -6.540283203125, -5.86376953125, -5.187255859375, -4.5107421875, -3.834228515625, -3.15771484375, -2.481201171875, -1.8046875, -1.128173828125, -0.45166015625, 0.224853515625, 0.9013671875, 1.577880859375, 2.25439453125, 2.930908203125, 3.607421875, 4.283935546875, 4.96044921875, 5.636962890625, 6.3134765625, 6.989990234375, 7.66650390625, 8.343017578125, 9.01953125, 9.696044921875, 10.37255859375, 11.049072265625, 11.7255859375, 12.402099609375, 13.07861328125, 13.755126953125, 14.431640625, 15.108154296875, 15.78466796875, 16.461181640625, 17.1376953125, 17.814208984375, 18.49072265625, 19.167236328125, 19.84375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 7.0, 6.0, 10.0, 7.0, 3.0, 16.0, 17.0, 17.0, 27.0, 25.0, 29.0, 34.0, 22.0, 41.0, 55.0, 43.0, 48.0, 40.0, 42.0, 46.0, 35.0, 48.0, 43.0, 43.0, 36.0, 37.0, 34.0, 33.0, 21.0, 21.0, 17.0, 27.0, 12.0, 9.0, 6.0, 7.0, 3.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.40625, -27.38427734375, -26.3623046875, -25.34033203125, -24.318359375, -23.29638671875, -22.2744140625, -21.25244140625, -20.23046875, -19.20849609375, -18.1865234375, -17.16455078125, -16.142578125, -15.12060546875, -14.0986328125, -13.07666015625, -12.0546875, -11.03271484375, -10.0107421875, -8.98876953125, -7.966796875, -6.94482421875, -5.9228515625, -4.90087890625, -3.87890625, -2.85693359375, -1.8349609375, -0.81298828125, 0.208984375, 1.23095703125, 2.2529296875, 3.27490234375, 4.296875, 5.31884765625, 6.3408203125, 7.36279296875, 8.384765625, 9.40673828125, 10.4287109375, 11.45068359375, 12.47265625, 13.49462890625, 14.5166015625, 15.53857421875, 16.560546875, 17.58251953125, 18.6044921875, 19.62646484375, 20.6484375, 21.67041015625, 22.6923828125, 23.71435546875, 24.736328125, 25.75830078125, 26.7802734375, 27.80224609375, 28.82421875, 29.84619140625, 30.8681640625, 31.89013671875, 32.912109375, 33.93408203125, 34.9560546875, 35.97802734375, 37.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 18.0, 20.0, 41.0, 40.0, 68.0, 107.0, 152.0, 255.0, 356.0, 562.0, 782.0, 1285.0, 2028.0, 3064.0, 4784.0, 7908.0, 12806.0, 22322.0, 40218.0, 80458.0, 185266.0, 331329.0, 179958.0, 79122.0, 40135.0, 21787.0, 12796.0, 7599.0, 4759.0, 2952.0, 1882.0, 1245.0, 840.0, 552.0, 364.0, 231.0, 168.0, 88.0, 52.0, 46.0, 27.0, 23.0, 13.0, 14.0, 11.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.21875, -28.26025390625, -27.3017578125, -26.34326171875, -25.384765625, -24.42626953125, -23.4677734375, -22.50927734375, -21.55078125, -20.59228515625, -19.6337890625, -18.67529296875, -17.716796875, -16.75830078125, -15.7998046875, -14.84130859375, -13.8828125, -12.92431640625, -11.9658203125, -11.00732421875, -10.048828125, -9.09033203125, -8.1318359375, -7.17333984375, -6.21484375, -5.25634765625, -4.2978515625, -3.33935546875, -2.380859375, -1.42236328125, -0.4638671875, 0.49462890625, 1.453125, 2.41162109375, 3.3701171875, 4.32861328125, 5.287109375, 6.24560546875, 7.2041015625, 8.16259765625, 9.12109375, 10.07958984375, 11.0380859375, 11.99658203125, 12.955078125, 13.91357421875, 14.8720703125, 15.83056640625, 16.7890625, 17.74755859375, 18.7060546875, 19.66455078125, 20.623046875, 21.58154296875, 22.5400390625, 23.49853515625, 24.45703125, 25.41552734375, 26.3740234375, 27.33251953125, 28.291015625, 29.24951171875, 30.2080078125, 31.16650390625, 32.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 8.0, 5.0, 5.0, 7.0, 5.0, 8.0, 13.0, 10.0, 17.0, 15.0, 16.0, 22.0, 31.0, 22.0, 27.0, 23.0, 38.0, 29.0, 29.0, 50.0, 34.0, 36.0, 44.0, 38.0, 36.0, 38.0, 40.0, 41.0, 38.0, 34.0, 34.0, 29.0, 33.0, 21.0, 17.0, 22.0, 19.0, 10.0, 11.0, 11.0, 8.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.34375, -18.75244140625, -18.1611328125, -17.56982421875, -16.978515625, -16.38720703125, -15.7958984375, -15.20458984375, -14.61328125, -14.02197265625, -13.4306640625, -12.83935546875, -12.248046875, -11.65673828125, -11.0654296875, -10.47412109375, -9.8828125, -9.29150390625, -8.7001953125, -8.10888671875, -7.517578125, -6.92626953125, -6.3349609375, -5.74365234375, -5.15234375, -4.56103515625, -3.9697265625, -3.37841796875, -2.787109375, -2.19580078125, -1.6044921875, -1.01318359375, -0.421875, 0.16943359375, 0.7607421875, 1.35205078125, 1.943359375, 2.53466796875, 3.1259765625, 3.71728515625, 4.30859375, 4.89990234375, 5.4912109375, 6.08251953125, 6.673828125, 7.26513671875, 7.8564453125, 8.44775390625, 9.0390625, 9.63037109375, 10.2216796875, 10.81298828125, 11.404296875, 11.99560546875, 12.5869140625, 13.17822265625, 13.76953125, 14.36083984375, 14.9521484375, 15.54345703125, 16.134765625, 16.72607421875, 17.3173828125, 17.90869140625, 18.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 9.0, 9.0, 12.0, 19.0, 28.0, 31.0, 48.0, 83.0, 94.0, 187.0, 297.0, 445.0, 845.0, 1506.0, 2967.0, 5936.0, 13104.0, 30892.0, 81385.0, 233454.0, 394767.0, 175024.0, 62221.0, 24110.0, 10579.0, 4885.0, 2500.0, 1262.0, 744.0, 410.0, 256.0, 147.0, 96.0, 56.0, 44.0, 32.0, 17.0, 16.0, 3.0, 4.0, 7.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.078125, -9.7667236328125, -9.455322265625, -9.1439208984375, -8.83251953125, -8.5211181640625, -8.209716796875, -7.8983154296875, -7.5869140625, -7.2755126953125, -6.964111328125, -6.6527099609375, -6.34130859375, -6.0299072265625, -5.718505859375, -5.4071044921875, -5.095703125, -4.7843017578125, -4.472900390625, -4.1614990234375, -3.85009765625, -3.5386962890625, -3.227294921875, -2.9158935546875, -2.6044921875, -2.2930908203125, -1.981689453125, -1.6702880859375, -1.35888671875, -1.0474853515625, -0.736083984375, -0.4246826171875, -0.11328125, 0.1981201171875, 0.509521484375, 0.8209228515625, 1.13232421875, 1.4437255859375, 1.755126953125, 2.0665283203125, 2.3779296875, 2.6893310546875, 3.000732421875, 3.3121337890625, 3.62353515625, 3.9349365234375, 4.246337890625, 4.5577392578125, 4.869140625, 5.1805419921875, 5.491943359375, 5.8033447265625, 6.11474609375, 6.4261474609375, 6.737548828125, 7.0489501953125, 7.3603515625, 7.6717529296875, 7.983154296875, 8.2945556640625, 8.60595703125, 8.9173583984375, 9.228759765625, 9.5401611328125, 9.8515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 11.0, 15.0, 17.0, 26.0, 37.0, 47.0, 54.0, 75.0, 50.0, 81.0, 69.0, 90.0, 75.0, 62.0, 55.0, 50.0, 40.0, 28.0, 25.0, 19.0, 14.0, 12.0, 7.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0009746551513671875, -0.0009489357471466064, -0.0009232163429260254, -0.0008974969387054443, -0.0008717775344848633, -0.0008460581302642822, -0.0008203387260437012, -0.0007946193218231201, -0.0007688999176025391, -0.000743180513381958, -0.000717461109161377, -0.0006917417049407959, -0.0006660223007202148, -0.0006403028964996338, -0.0006145834922790527, -0.0005888640880584717, -0.0005631446838378906, -0.0005374252796173096, -0.0005117058753967285, -0.00048598647117614746, -0.0004602670669555664, -0.00043454766273498535, -0.0004088282585144043, -0.00038310885429382324, -0.0003573894500732422, -0.00033167004585266113, -0.0003059506416320801, -0.000280231237411499, -0.00025451183319091797, -0.00022879242897033691, -0.00020307302474975586, -0.0001773536205291748, -0.00015163421630859375, -0.0001259148120880127, -0.00010019540786743164, -7.447600364685059e-05, -4.875659942626953e-05, -2.3037195205688477e-05, 2.682209014892578e-06, 2.8401613235473633e-05, 5.412101745605469e-05, 7.984042167663574e-05, 0.0001055598258972168, 0.00013127923011779785, 0.0001569986343383789, 0.00018271803855895996, 0.00020843744277954102, 0.00023415684700012207, 0.0002598762512207031, 0.0002855956554412842, 0.00031131505966186523, 0.0003370344638824463, 0.00036275386810302734, 0.0003884732723236084, 0.00041419267654418945, 0.0004399120807647705, 0.00046563148498535156, 0.0004913508892059326, 0.0005170702934265137, 0.0005427896976470947, 0.0005685091018676758, 0.0005942285060882568, 0.0006199479103088379, 0.0006456673145294189, 0.00067138671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 6.0, 9.0, 12.0, 23.0, 20.0, 27.0, 35.0, 61.0, 86.0, 112.0, 179.0, 244.0, 317.0, 441.0, 635.0, 887.0, 1268.0, 2043.0, 3154.0, 4952.0, 7859.0, 13185.0, 22901.0, 40634.0, 74186.0, 135201.0, 213936.0, 214713.0, 135990.0, 75239.0, 41260.0, 23166.0, 13337.0, 8001.0, 4844.0, 3214.0, 2028.0, 1304.0, 920.0, 640.0, 439.0, 301.0, 198.0, 155.0, 110.0, 73.0, 51.0, 53.0, 33.0, 23.0, 23.0, 9.0, 12.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.51171875, -7.26947021484375, -7.0272216796875, -6.78497314453125, -6.542724609375, -6.30047607421875, -6.0582275390625, -5.81597900390625, -5.57373046875, -5.33148193359375, -5.0892333984375, -4.84698486328125, -4.604736328125, -4.36248779296875, -4.1202392578125, -3.87799072265625, -3.6357421875, -3.39349365234375, -3.1512451171875, -2.90899658203125, -2.666748046875, -2.42449951171875, -2.1822509765625, -1.94000244140625, -1.69775390625, -1.45550537109375, -1.2132568359375, -0.97100830078125, -0.728759765625, -0.48651123046875, -0.2442626953125, -0.00201416015625, 0.240234375, 0.48248291015625, 0.7247314453125, 0.96697998046875, 1.209228515625, 1.45147705078125, 1.6937255859375, 1.93597412109375, 2.17822265625, 2.42047119140625, 2.6627197265625, 2.90496826171875, 3.147216796875, 3.38946533203125, 3.6317138671875, 3.87396240234375, 4.1162109375, 4.35845947265625, 4.6007080078125, 4.84295654296875, 5.085205078125, 5.32745361328125, 5.5697021484375, 5.81195068359375, 6.05419921875, 6.29644775390625, 6.5386962890625, 6.78094482421875, 7.023193359375, 7.26544189453125, 7.5076904296875, 7.74993896484375, 7.9921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 4.0, 13.0, 9.0, 14.0, 25.0, 29.0, 32.0, 40.0, 29.0, 25.0, 37.0, 56.0, 51.0, 55.0, 61.0, 56.0, 54.0, 59.0, 57.0, 36.0, 38.0, 32.0, 32.0, 13.0, 29.0, 14.0, 12.0, 14.0, 14.0, 13.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.544921875, -2.466522216796875, -2.38812255859375, -2.309722900390625, -2.2313232421875, -2.152923583984375, -2.07452392578125, -1.996124267578125, -1.917724609375, -1.839324951171875, -1.76092529296875, -1.682525634765625, -1.6041259765625, -1.525726318359375, -1.44732666015625, -1.368927001953125, -1.29052734375, -1.212127685546875, -1.13372802734375, -1.055328369140625, -0.9769287109375, -0.898529052734375, -0.82012939453125, -0.741729736328125, -0.663330078125, -0.584930419921875, -0.50653076171875, -0.428131103515625, -0.3497314453125, -0.271331787109375, -0.19293212890625, -0.114532470703125, -0.0361328125, 0.042266845703125, 0.12066650390625, 0.199066162109375, 0.2774658203125, 0.355865478515625, 0.43426513671875, 0.512664794921875, 0.591064453125, 0.669464111328125, 0.74786376953125, 0.826263427734375, 0.9046630859375, 0.983062744140625, 1.06146240234375, 1.139862060546875, 1.21826171875, 1.296661376953125, 1.37506103515625, 1.453460693359375, 1.5318603515625, 1.610260009765625, 1.68865966796875, 1.767059326171875, 1.845458984375, 1.923858642578125, 2.00225830078125, 2.080657958984375, 2.1590576171875, 2.237457275390625, 2.31585693359375, 2.394256591796875, 2.47265625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 13.0, 11.0, 11.0, 14.0, 20.0, 20.0, 22.0, 33.0, 39.0, 43.0, 52.0, 62.0, 60.0, 71.0, 74.0, 71.0, 62.0, 46.0, 56.0, 39.0, 40.0, 30.0, 20.0, 19.0, 14.0, 16.0, 9.0, 6.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.11594581604004, -28.96799659729004, -27.820049285888672, -26.672100067138672, -25.524152755737305, -24.376203536987305, -23.228256225585938, -22.080307006835938, -20.932357788085938, -19.784408569335938, -18.63646125793457, -17.48851203918457, -16.340564727783203, -15.192615509033203, -14.04466724395752, -12.896718978881836, -11.748771667480469, -10.600823402404785, -9.452875137329102, -8.304925918579102, -7.156978130340576, -6.009029865264893, -4.861081123352051, -3.713132858276367, -2.5651845932006836, -1.4172362089157104, -0.2692878246307373, 0.8786606788635254, 2.026608943939209, 3.1745572090148926, 4.322505950927734, 5.470454216003418, 6.618400573730469, 7.766348838806152, 8.914297103881836, 10.062246322631836, 11.210193634033203, 12.358142852783203, 13.506091117858887, 14.65403938293457, 15.801987648010254, 16.949935913085938, 18.097885131835938, 19.245832443237305, 20.393781661987305, 21.541728973388672, 22.689678192138672, 23.837627410888672, 24.98557472229004, 26.13352394104004, 27.281471252441406, 28.429420471191406, 29.577367782592773, 30.725317001342773, 31.87326431274414, 33.02121353149414, 34.16916275024414, 35.31711196899414, 36.46506118774414, 37.613006591796875, 38.760955810546875, 39.908905029296875, 41.056854248046875, 42.204803466796875, 43.35274887084961]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 5.0, 3.0, 8.0, 9.0, 16.0, 4.0, 14.0, 17.0, 23.0, 20.0, 27.0, 34.0, 28.0, 32.0, 43.0, 36.0, 48.0, 34.0, 33.0, 40.0, 36.0, 41.0, 46.0, 36.0, 46.0, 45.0, 39.0, 38.0, 33.0, 21.0, 16.0, 19.0, 22.0, 22.0, 15.0, 7.0, 8.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.48418617248535, -26.535245895385742, -25.586307525634766, -24.637367248535156, -23.688426971435547, -22.739486694335938, -21.79054832458496, -20.84160804748535, -19.892669677734375, -18.943729400634766, -17.99479103088379, -17.04585075378418, -16.09691047668457, -15.147971153259277, -14.199031829833984, -13.250091552734375, -12.301151275634766, -11.352211952209473, -10.403271675109863, -9.45433235168457, -8.505392074584961, -7.556452751159668, -6.607513427734375, -5.658573627471924, -4.709633827209473, -3.7606940269470215, -2.8117544651031494, -1.8628149032592773, -0.9138751029968262, 0.035064697265625, 0.984004020690918, 1.9329438209533691, 2.8818817138671875, 3.8308215141296387, 4.77976131439209, 5.728700637817383, 6.677640438079834, 7.626580238342285, 8.575519561767578, 9.524459838867188, 10.47339916229248, 11.422338485717773, 12.371278762817383, 13.320218086242676, 14.269157409667969, 15.218097686767578, 16.167037963867188, 17.115976333618164, 18.064916610717773, 19.013856887817383, 19.96279525756836, 20.91173553466797, 21.860675811767578, 22.809616088867188, 23.758554458618164, 24.707494735717773, 25.65643310546875, 26.60537338256836, 27.554311752319336, 28.503252029418945, 29.452192306518555, 30.40113067626953, 31.35007095336914, 32.29901123046875, 33.24795150756836]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 12.0, 22.0, 43.0, 37.0, 48.0, 69.0, 118.0, 143.0, 234.0, 252.0, 473.0, 643.0, 999.0, 1507.0, 2341.0, 3582.0, 5815.0, 9469.0, 15864.0, 26251.0, 44416.0, 75638.0, 127650.0, 190309.0, 199100.0, 138370.0, 82855.0, 48474.0, 28547.0, 17055.0, 10408.0, 6307.0, 3933.0, 2609.0, 1576.0, 1102.0, 702.0, 487.0, 316.0, 227.0, 181.0, 121.0, 71.0, 48.0, 49.0, 26.0, 14.0, 11.0, 15.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.09375, -34.9326171875, -33.771484375, -32.6103515625, -31.44921875, -30.2880859375, -29.126953125, -27.9658203125, -26.8046875, -25.6435546875, -24.482421875, -23.3212890625, -22.16015625, -20.9990234375, -19.837890625, -18.6767578125, -17.515625, -16.3544921875, -15.193359375, -14.0322265625, -12.87109375, -11.7099609375, -10.548828125, -9.3876953125, -8.2265625, -7.0654296875, -5.904296875, -4.7431640625, -3.58203125, -2.4208984375, -1.259765625, -0.0986328125, 1.0625, 2.2236328125, 3.384765625, 4.5458984375, 5.70703125, 6.8681640625, 8.029296875, 9.1904296875, 10.3515625, 11.5126953125, 12.673828125, 13.8349609375, 14.99609375, 16.1572265625, 17.318359375, 18.4794921875, 19.640625, 20.8017578125, 21.962890625, 23.1240234375, 24.28515625, 25.4462890625, 26.607421875, 27.7685546875, 28.9296875, 30.0908203125, 31.251953125, 32.4130859375, 33.57421875, 34.7353515625, 35.896484375, 37.0576171875, 38.21875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 2.0, 3.0, 8.0, 14.0, 9.0, 13.0, 18.0, 19.0, 14.0, 25.0, 36.0, 36.0, 29.0, 33.0, 47.0, 51.0, 36.0, 38.0, 39.0, 42.0, 50.0, 48.0, 39.0, 58.0, 34.0, 33.0, 36.0, 27.0, 25.0, 24.0, 24.0, 11.0, 20.0, 15.0, 6.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.546875, -27.561279296875, -26.57568359375, -25.590087890625, -24.6044921875, -23.618896484375, -22.63330078125, -21.647705078125, -20.662109375, -19.676513671875, -18.69091796875, -17.705322265625, -16.7197265625, -15.734130859375, -14.74853515625, -13.762939453125, -12.77734375, -11.791748046875, -10.80615234375, -9.820556640625, -8.8349609375, -7.849365234375, -6.86376953125, -5.878173828125, -4.892578125, -3.906982421875, -2.92138671875, -1.935791015625, -0.9501953125, 0.035400390625, 1.02099609375, 2.006591796875, 2.9921875, 3.977783203125, 4.96337890625, 5.948974609375, 6.9345703125, 7.920166015625, 8.90576171875, 9.891357421875, 10.876953125, 11.862548828125, 12.84814453125, 13.833740234375, 14.8193359375, 15.804931640625, 16.79052734375, 17.776123046875, 18.76171875, 19.747314453125, 20.73291015625, 21.718505859375, 22.7041015625, 23.689697265625, 24.67529296875, 25.660888671875, 26.646484375, 27.632080078125, 28.61767578125, 29.603271484375, 30.5888671875, 31.574462890625, 32.56005859375, 33.545654296875, 34.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 13.0, 17.0, 13.0, 38.0, 46.0, 60.0, 82.0, 133.0, 180.0, 300.0, 419.0, 588.0, 921.0, 1311.0, 1973.0, 2965.0, 4521.0, 6793.0, 10234.0, 15872.0, 24676.0, 39124.0, 61328.0, 96746.0, 146143.0, 183297.0, 156526.0, 105962.0, 67385.0, 43086.0, 27016.0, 17334.0, 11242.0, 7440.0, 4860.0, 3257.0, 2127.0, 1471.0, 946.0, 658.0, 472.0, 287.0, 235.0, 138.0, 107.0, 68.0, 53.0, 32.0, 25.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.65625, -32.59130859375, -31.5263671875, -30.46142578125, -29.396484375, -28.33154296875, -27.2666015625, -26.20166015625, -25.13671875, -24.07177734375, -23.0068359375, -21.94189453125, -20.876953125, -19.81201171875, -18.7470703125, -17.68212890625, -16.6171875, -15.55224609375, -14.4873046875, -13.42236328125, -12.357421875, -11.29248046875, -10.2275390625, -9.16259765625, -8.09765625, -7.03271484375, -5.9677734375, -4.90283203125, -3.837890625, -2.77294921875, -1.7080078125, -0.64306640625, 0.421875, 1.48681640625, 2.5517578125, 3.61669921875, 4.681640625, 5.74658203125, 6.8115234375, 7.87646484375, 8.94140625, 10.00634765625, 11.0712890625, 12.13623046875, 13.201171875, 14.26611328125, 15.3310546875, 16.39599609375, 17.4609375, 18.52587890625, 19.5908203125, 20.65576171875, 21.720703125, 22.78564453125, 23.8505859375, 24.91552734375, 25.98046875, 27.04541015625, 28.1103515625, 29.17529296875, 30.240234375, 31.30517578125, 32.3701171875, 33.43505859375, 34.5]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 13.0, 9.0, 11.0, 13.0, 16.0, 23.0, 17.0, 26.0, 24.0, 33.0, 41.0, 31.0, 24.0, 42.0, 44.0, 46.0, 40.0, 46.0, 39.0, 40.0, 32.0, 33.0, 30.0, 34.0, 38.0, 35.0, 27.0, 19.0, 27.0, 19.0, 26.0, 7.0, 16.0, 15.0, 9.0, 6.0, 14.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-20.03125, -19.42626953125, -18.8212890625, -18.21630859375, -17.611328125, -17.00634765625, -16.4013671875, -15.79638671875, -15.19140625, -14.58642578125, -13.9814453125, -13.37646484375, -12.771484375, -12.16650390625, -11.5615234375, -10.95654296875, -10.3515625, -9.74658203125, -9.1416015625, -8.53662109375, -7.931640625, -7.32666015625, -6.7216796875, -6.11669921875, -5.51171875, -4.90673828125, -4.3017578125, -3.69677734375, -3.091796875, -2.48681640625, -1.8818359375, -1.27685546875, -0.671875, -0.06689453125, 0.5380859375, 1.14306640625, 1.748046875, 2.35302734375, 2.9580078125, 3.56298828125, 4.16796875, 4.77294921875, 5.3779296875, 5.98291015625, 6.587890625, 7.19287109375, 7.7978515625, 8.40283203125, 9.0078125, 9.61279296875, 10.2177734375, 10.82275390625, 11.427734375, 12.03271484375, 12.6376953125, 13.24267578125, 13.84765625, 14.45263671875, 15.0576171875, 15.66259765625, 16.267578125, 16.87255859375, 17.4775390625, 18.08251953125, 18.6875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 14.0, 15.0, 18.0, 31.0, 59.0, 75.0, 85.0, 129.0, 196.0, 296.0, 445.0, 623.0, 910.0, 1276.0, 1935.0, 2861.0, 4666.0, 7178.0, 12050.0, 20247.0, 36016.0, 65074.0, 115439.0, 194141.0, 226680.0, 153817.0, 87139.0, 48445.0, 26973.0, 15623.0, 9274.0, 5688.0, 3673.0, 2359.0, 1588.0, 1090.0, 736.0, 517.0, 373.0, 230.0, 171.0, 118.0, 75.0, 61.0, 38.0, 30.0, 28.0, 20.0, 12.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.9140625, -13.482666015625, -13.05126953125, -12.619873046875, -12.1884765625, -11.757080078125, -11.32568359375, -10.894287109375, -10.462890625, -10.031494140625, -9.60009765625, -9.168701171875, -8.7373046875, -8.305908203125, -7.87451171875, -7.443115234375, -7.01171875, -6.580322265625, -6.14892578125, -5.717529296875, -5.2861328125, -4.854736328125, -4.42333984375, -3.991943359375, -3.560546875, -3.129150390625, -2.69775390625, -2.266357421875, -1.8349609375, -1.403564453125, -0.97216796875, -0.540771484375, -0.109375, 0.322021484375, 0.75341796875, 1.184814453125, 1.6162109375, 2.047607421875, 2.47900390625, 2.910400390625, 3.341796875, 3.773193359375, 4.20458984375, 4.635986328125, 5.0673828125, 5.498779296875, 5.93017578125, 6.361572265625, 6.79296875, 7.224365234375, 7.65576171875, 8.087158203125, 8.5185546875, 8.949951171875, 9.38134765625, 9.812744140625, 10.244140625, 10.675537109375, 11.10693359375, 11.538330078125, 11.9697265625, 12.401123046875, 12.83251953125, 13.263916015625, 13.6953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 6.0, 13.0, 18.0, 27.0, 27.0, 43.0, 61.0, 55.0, 78.0, 103.0, 104.0, 93.0, 91.0, 56.0, 52.0, 37.0, 31.0, 24.0, 20.0, 16.0, 9.0, 13.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019588470458984375, -0.0019006580114364624, -0.0018424689769744873, -0.0017842799425125122, -0.0017260909080505371, -0.001667901873588562, -0.001609712839126587, -0.0015515238046646118, -0.0014933347702026367, -0.0014351457357406616, -0.0013769567012786865, -0.0013187676668167114, -0.0012605786323547363, -0.0012023895978927612, -0.0011442005634307861, -0.001086011528968811, -0.001027822494506836, -0.0009696334600448608, -0.0009114444255828857, -0.0008532553911209106, -0.0007950663566589355, -0.0007368773221969604, -0.0006786882877349854, -0.0006204992532730103, -0.0005623102188110352, -0.0005041211843490601, -0.00044593214988708496, -0.00038774311542510986, -0.00032955408096313477, -0.00027136504650115967, -0.00021317601203918457, -0.00015498697757720947, -9.679794311523438e-05, -3.860890865325928e-05, 1.958012580871582e-05, 7.776916027069092e-05, 0.00013595819473266602, 0.0001941472291946411, 0.0002523362636566162, 0.0003105252981185913, 0.0003687143325805664, 0.0004269033670425415, 0.0004850924015045166, 0.0005432814359664917, 0.0006014704704284668, 0.0006596595048904419, 0.000717848539352417, 0.0007760375738143921, 0.0008342266082763672, 0.0008924156427383423, 0.0009506046772003174, 0.0010087937116622925, 0.0010669827461242676, 0.0011251717805862427, 0.0011833608150482178, 0.0012415498495101929, 0.001299738883972168, 0.001357927918434143, 0.0014161169528961182, 0.0014743059873580933, 0.0015324950218200684, 0.0015906840562820435, 0.0016488730907440186, 0.0017070621252059937, 0.0017652511596679688]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 14.0, 9.0, 18.0, 21.0, 36.0, 50.0, 71.0, 74.0, 140.0, 181.0, 255.0, 381.0, 614.0, 916.0, 1443.0, 2330.0, 3794.0, 6541.0, 11643.0, 21174.0, 40724.0, 79475.0, 155702.0, 260167.0, 218421.0, 116056.0, 59127.0, 30324.0, 16422.0, 8824.0, 5213.0, 3032.0, 1810.0, 1263.0, 717.0, 491.0, 378.0, 223.0, 145.0, 103.0, 76.0, 57.0, 27.0, 31.0, 10.0, 7.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.03125, -15.492919921875, -14.95458984375, -14.416259765625, -13.8779296875, -13.339599609375, -12.80126953125, -12.262939453125, -11.724609375, -11.186279296875, -10.64794921875, -10.109619140625, -9.5712890625, -9.032958984375, -8.49462890625, -7.956298828125, -7.41796875, -6.879638671875, -6.34130859375, -5.802978515625, -5.2646484375, -4.726318359375, -4.18798828125, -3.649658203125, -3.111328125, -2.572998046875, -2.03466796875, -1.496337890625, -0.9580078125, -0.419677734375, 0.11865234375, 0.656982421875, 1.1953125, 1.733642578125, 2.27197265625, 2.810302734375, 3.3486328125, 3.886962890625, 4.42529296875, 4.963623046875, 5.501953125, 6.040283203125, 6.57861328125, 7.116943359375, 7.6552734375, 8.193603515625, 8.73193359375, 9.270263671875, 9.80859375, 10.346923828125, 10.88525390625, 11.423583984375, 11.9619140625, 12.500244140625, 13.03857421875, 13.576904296875, 14.115234375, 14.653564453125, 15.19189453125, 15.730224609375, 16.2685546875, 16.806884765625, 17.34521484375, 17.883544921875, 18.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 8.0, 4.0, 12.0, 20.0, 16.0, 28.0, 32.0, 32.0, 36.0, 48.0, 51.0, 45.0, 54.0, 64.0, 60.0, 53.0, 51.0, 69.0, 48.0, 32.0, 44.0, 35.0, 27.0, 16.0, 15.0, 17.0, 11.0, 9.0, 10.0, 4.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.71875, -4.55792236328125, -4.3970947265625, -4.23626708984375, -4.075439453125, -3.91461181640625, -3.7537841796875, -3.59295654296875, -3.43212890625, -3.27130126953125, -3.1104736328125, -2.94964599609375, -2.788818359375, -2.62799072265625, -2.4671630859375, -2.30633544921875, -2.1455078125, -1.98468017578125, -1.8238525390625, -1.66302490234375, -1.502197265625, -1.34136962890625, -1.1805419921875, -1.01971435546875, -0.85888671875, -0.69805908203125, -0.5372314453125, -0.37640380859375, -0.215576171875, -0.05474853515625, 0.1060791015625, 0.26690673828125, 0.427734375, 0.58856201171875, 0.7493896484375, 0.91021728515625, 1.071044921875, 1.23187255859375, 1.3927001953125, 1.55352783203125, 1.71435546875, 1.87518310546875, 2.0360107421875, 2.19683837890625, 2.357666015625, 2.51849365234375, 2.6793212890625, 2.84014892578125, 3.0009765625, 3.16180419921875, 3.3226318359375, 3.48345947265625, 3.644287109375, 3.80511474609375, 3.9659423828125, 4.12677001953125, 4.28759765625, 4.44842529296875, 4.6092529296875, 4.77008056640625, 4.930908203125, 5.09173583984375, 5.2525634765625, 5.41339111328125, 5.57421875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 13.0, 12.0, 8.0, 15.0, 16.0, 20.0, 13.0, 17.0, 29.0, 38.0, 38.0, 47.0, 52.0, 56.0, 54.0, 70.0, 67.0, 62.0, 47.0, 52.0, 43.0, 34.0, 27.0, 35.0, 24.0, 13.0, 11.0, 19.0, 9.0, 10.0, 10.0, 6.0, 9.0, 4.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.63134765625, -29.641857147216797, -28.652366638183594, -27.66287612915039, -26.673383712768555, -25.68389320373535, -24.69440269470215, -23.704912185668945, -22.715421676635742, -21.72593116760254, -20.736440658569336, -19.7469482421875, -18.757457733154297, -17.767967224121094, -16.77847671508789, -15.788986206054688, -14.799494743347168, -13.810004234313965, -12.820512771606445, -11.831022262573242, -10.841531753540039, -9.852041244506836, -8.862549781799316, -7.873059272766113, -6.883568286895752, -5.894077301025391, -4.9045867919921875, -3.915095806121826, -2.925605058670044, -1.9361143112182617, -0.9466233253479004, 0.042867183685302734, 1.032358169555664, 2.0218489170074463, 3.0113396644592285, 4.00083065032959, 4.990321159362793, 5.979812145233154, 6.969303131103516, 7.958793640136719, 8.948284149169922, 9.937774658203125, 10.927266120910645, 11.916756629943848, 12.90624713897705, 13.89573860168457, 14.885229110717773, 15.874719619750977, 16.864212036132812, 17.853702545166016, 18.84319305419922, 19.832683563232422, 20.822175979614258, 21.81166648864746, 22.801156997680664, 23.790647506713867, 24.78013801574707, 25.769628524780273, 26.759119033813477, 27.748611450195312, 28.738101959228516, 29.72759246826172, 30.717082977294922, 31.706573486328125, 32.69606399536133]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 4.0, 4.0, 8.0, 10.0, 12.0, 8.0, 13.0, 13.0, 10.0, 22.0, 28.0, 22.0, 32.0, 31.0, 48.0, 33.0, 35.0, 34.0, 40.0, 39.0, 40.0, 33.0, 55.0, 57.0, 46.0, 39.0, 33.0, 36.0, 38.0, 36.0, 31.0, 18.0, 18.0, 14.0, 10.0, 12.0, 9.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.73298263549805, -31.6606388092041, -30.588294982910156, -29.51595115661621, -28.443607330322266, -27.371261596679688, -26.298917770385742, -25.226573944091797, -24.15423011779785, -23.081886291503906, -22.00954246520996, -20.937198638916016, -19.864852905273438, -18.792510986328125, -17.720165252685547, -16.6478214263916, -15.575477600097656, -14.503133773803711, -13.430789947509766, -12.358445167541504, -11.286101341247559, -10.213757514953613, -9.141412734985352, -8.069068908691406, -6.996725082397461, -5.924381256103516, -4.852036952972412, -3.7796928882598877, -2.7073488235473633, -1.635004997253418, -0.5626606941223145, 0.5096836090087891, 1.5820236206054688, 2.654367685317993, 3.7267117500305176, 4.799056053161621, 5.871399879455566, 6.943743705749512, 8.016088485717773, 9.088432312011719, 10.160776138305664, 11.23311996459961, 12.305463790893555, 13.377808570861816, 14.450152397155762, 15.522496223449707, 16.59484100341797, 17.667184829711914, 18.73952865600586, 19.811872482299805, 20.88421630859375, 21.956560134887695, 23.02890396118164, 24.10124969482422, 25.173593521118164, 26.24593734741211, 27.318281173706055, 28.390625, 29.462968826293945, 30.53531265258789, 31.60765838623047, 32.68000030517578, 33.75234603881836, 34.82469177246094, 35.89703369140625]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 15.0, 24.0, 33.0, 46.0, 60.0, 101.0, 154.0, 212.0, 353.0, 590.0, 992.0, 1719.0, 3071.0, 5870.0, 11618.0, 24885.0, 58800.0, 166852.0, 589452.0, 1646101.0, 1161127.0, 337742.0, 104979.0, 41353.0, 18563.0, 8848.0, 4577.0, 2613.0, 1398.0, 823.0, 472.0, 294.0, 195.0, 99.0, 84.0, 56.0, 29.0, 26.0, 13.0, 16.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-57.40625, -55.70703125, -54.0078125, -52.30859375, -50.609375, -48.91015625, -47.2109375, -45.51171875, -43.8125, -42.11328125, -40.4140625, -38.71484375, -37.015625, -35.31640625, -33.6171875, -31.91796875, -30.21875, -28.51953125, -26.8203125, -25.12109375, -23.421875, -21.72265625, -20.0234375, -18.32421875, -16.625, -14.92578125, -13.2265625, -11.52734375, -9.828125, -8.12890625, -6.4296875, -4.73046875, -3.03125, -1.33203125, 0.3671875, 2.06640625, 3.765625, 5.46484375, 7.1640625, 8.86328125, 10.5625, 12.26171875, 13.9609375, 15.66015625, 17.359375, 19.05859375, 20.7578125, 22.45703125, 24.15625, 25.85546875, 27.5546875, 29.25390625, 30.953125, 32.65234375, 34.3515625, 36.05078125, 37.75, 39.44921875, 41.1484375, 42.84765625, 44.546875, 46.24609375, 47.9453125, 49.64453125, 51.34375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 6.0, 0.0, 11.0, 8.0, 7.0, 8.0, 19.0, 10.0, 9.0, 12.0, 18.0, 27.0, 23.0, 40.0, 27.0, 42.0, 39.0, 31.0, 27.0, 40.0, 37.0, 41.0, 51.0, 46.0, 45.0, 50.0, 46.0, 43.0, 30.0, 38.0, 28.0, 27.0, 19.0, 21.0, 10.0, 9.0, 13.0, 13.0, 7.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.125, -32.139404296875, -31.15380859375, -30.168212890625, -29.1826171875, -28.197021484375, -27.21142578125, -26.225830078125, -25.240234375, -24.254638671875, -23.26904296875, -22.283447265625, -21.2978515625, -20.312255859375, -19.32666015625, -18.341064453125, -17.35546875, -16.369873046875, -15.38427734375, -14.398681640625, -13.4130859375, -12.427490234375, -11.44189453125, -10.456298828125, -9.470703125, -8.485107421875, -7.49951171875, -6.513916015625, -5.5283203125, -4.542724609375, -3.55712890625, -2.571533203125, -1.5859375, -0.600341796875, 0.38525390625, 1.370849609375, 2.3564453125, 3.342041015625, 4.32763671875, 5.313232421875, 6.298828125, 7.284423828125, 8.27001953125, 9.255615234375, 10.2412109375, 11.226806640625, 12.21240234375, 13.197998046875, 14.18359375, 15.169189453125, 16.15478515625, 17.140380859375, 18.1259765625, 19.111572265625, 20.09716796875, 21.082763671875, 22.068359375, 23.053955078125, 24.03955078125, 25.025146484375, 26.0107421875, 26.996337890625, 27.98193359375, 28.967529296875, 29.953125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [8.0, 1.0, 7.0, 7.0, 9.0, 15.0, 17.0, 31.0, 34.0, 43.0, 67.0, 105.0, 134.0, 203.0, 271.0, 402.0, 590.0, 872.0, 1246.0, 1838.0, 2822.0, 4430.0, 6847.0, 10856.0, 18845.0, 32495.0, 59437.0, 113174.0, 227545.0, 495106.0, 1081006.0, 1118286.0, 516599.0, 237300.0, 117548.0, 61606.0, 33627.0, 19206.0, 11211.0, 7161.0, 4420.0, 2855.0, 1839.0, 1217.0, 931.0, 597.0, 426.0, 274.0, 226.0, 159.0, 103.0, 61.0, 52.0, 50.0, 24.0, 20.0, 10.0, 10.0, 10.0, 8.0, 3.0, 1.0, 0.0, 1.0], "bins": [-41.375, -40.04150390625, -38.7080078125, -37.37451171875, -36.041015625, -34.70751953125, -33.3740234375, -32.04052734375, -30.70703125, -29.37353515625, -28.0400390625, -26.70654296875, -25.373046875, -24.03955078125, -22.7060546875, -21.37255859375, -20.0390625, -18.70556640625, -17.3720703125, -16.03857421875, -14.705078125, -13.37158203125, -12.0380859375, -10.70458984375, -9.37109375, -8.03759765625, -6.7041015625, -5.37060546875, -4.037109375, -2.70361328125, -1.3701171875, -0.03662109375, 1.296875, 2.63037109375, 3.9638671875, 5.29736328125, 6.630859375, 7.96435546875, 9.2978515625, 10.63134765625, 11.96484375, 13.29833984375, 14.6318359375, 15.96533203125, 17.298828125, 18.63232421875, 19.9658203125, 21.29931640625, 22.6328125, 23.96630859375, 25.2998046875, 26.63330078125, 27.966796875, 29.30029296875, 30.6337890625, 31.96728515625, 33.30078125, 34.63427734375, 35.9677734375, 37.30126953125, 38.634765625, 39.96826171875, 41.3017578125, 42.63525390625, 43.96875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 8.0, 6.0, 12.0, 9.0, 23.0, 18.0, 19.0, 35.0, 29.0, 54.0, 50.0, 78.0, 91.0, 90.0, 146.0, 166.0, 201.0, 275.0, 306.0, 310.0, 315.0, 304.0, 281.0, 245.0, 202.0, 162.0, 123.0, 109.0, 85.0, 72.0, 63.0, 39.0, 36.0, 16.0, 20.0, 13.0, 13.0, 6.0, 11.0, 8.0, 2.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.203125, -13.72119140625, -13.2392578125, -12.75732421875, -12.275390625, -11.79345703125, -11.3115234375, -10.82958984375, -10.34765625, -9.86572265625, -9.3837890625, -8.90185546875, -8.419921875, -7.93798828125, -7.4560546875, -6.97412109375, -6.4921875, -6.01025390625, -5.5283203125, -5.04638671875, -4.564453125, -4.08251953125, -3.6005859375, -3.11865234375, -2.63671875, -2.15478515625, -1.6728515625, -1.19091796875, -0.708984375, -0.22705078125, 0.2548828125, 0.73681640625, 1.21875, 1.70068359375, 2.1826171875, 2.66455078125, 3.146484375, 3.62841796875, 4.1103515625, 4.59228515625, 5.07421875, 5.55615234375, 6.0380859375, 6.52001953125, 7.001953125, 7.48388671875, 7.9658203125, 8.44775390625, 8.9296875, 9.41162109375, 9.8935546875, 10.37548828125, 10.857421875, 11.33935546875, 11.8212890625, 12.30322265625, 12.78515625, 13.26708984375, 13.7490234375, 14.23095703125, 14.712890625, 15.19482421875, 15.6767578125, 16.15869140625, 16.640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 12.0, 12.0, 22.0, 26.0, 36.0, 45.0, 52.0, 57.0, 63.0, 70.0, 78.0, 78.0, 79.0, 59.0, 56.0, 54.0, 44.0, 27.0, 18.0, 21.0, 22.0, 16.0, 5.0, 12.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.362735748291016, -45.93781280517578, -44.51289367675781, -43.08797073364258, -41.663047790527344, -40.23812484741211, -38.81320571899414, -37.388282775878906, -35.96335983276367, -34.53843688964844, -33.11351776123047, -31.688594818115234, -30.263671875, -28.8387508392334, -27.413829803466797, -25.988906860351562, -24.56398582458496, -23.13906478881836, -21.714141845703125, -20.289220809936523, -18.86429786682129, -17.439376831054688, -16.014453887939453, -14.589532852172852, -13.164610862731934, -11.739688873291016, -10.314766883850098, -8.88984489440918, -7.46492338180542, -6.040001392364502, -4.615079879760742, -3.190157890319824, -1.7652359008789062, -0.34031403064727783, 1.0846078395843506, 2.5095295906066895, 3.9344515800476074, 5.359373569488525, 6.784295082092285, 8.209217071533203, 9.634139060974121, 11.059061050415039, 12.483983039855957, 13.908905029296875, 15.333826065063477, 16.75874900817871, 18.183670043945312, 19.608592987060547, 21.03351402282715, 22.45843505859375, 23.883358001708984, 25.308279037475586, 26.73320198059082, 28.158123016357422, 29.583045959472656, 31.007966995239258, 32.43288803100586, 33.857810974121094, 35.28273010253906, 36.7076530456543, 38.13257598876953, 39.557498931884766, 40.982418060302734, 42.40734100341797, 43.8322639465332]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 1.0, 3.0, 7.0, 15.0, 6.0, 10.0, 17.0, 14.0, 19.0, 25.0, 19.0, 32.0, 26.0, 16.0, 37.0, 33.0, 41.0, 47.0, 44.0, 51.0, 52.0, 38.0, 51.0, 43.0, 48.0, 51.0, 37.0, 35.0, 40.0, 24.0, 19.0, 25.0, 13.0, 9.0, 9.0, 10.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.490203857421875, -41.285099029541016, -40.079994201660156, -38.8748893737793, -37.66978454589844, -36.46467971801758, -35.25957489013672, -34.05447006225586, -32.849365234375, -31.64426040649414, -30.43915557861328, -29.234050750732422, -28.028945922851562, -26.823841094970703, -25.618736267089844, -24.413631439208984, -23.208526611328125, -22.003421783447266, -20.798316955566406, -19.593212127685547, -18.388107299804688, -17.183002471923828, -15.977897644042969, -14.77279281616211, -13.56768798828125, -12.36258316040039, -11.157478332519531, -9.952373504638672, -8.747268676757812, -7.542163848876953, -6.337059020996094, -5.131954193115234, -3.9268455505371094, -2.72174072265625, -1.5166358947753906, -0.31153106689453125, 0.8935737609863281, 2.0986785888671875, 3.303783416748047, 4.508888244628906, 5.713993072509766, 6.919097900390625, 8.124202728271484, 9.329307556152344, 10.534412384033203, 11.739517211914062, 12.944622039794922, 14.149726867675781, 15.35483169555664, 16.5599365234375, 17.76504135131836, 18.97014617919922, 20.175251007080078, 21.380355834960938, 22.585460662841797, 23.790565490722656, 24.995670318603516, 26.200775146484375, 27.405879974365234, 28.610984802246094, 29.816089630126953, 31.021194458007812, 32.22629928588867, 33.43140411376953, 34.63650894165039]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 20.0, 28.0, 42.0, 58.0, 74.0, 116.0, 193.0, 265.0, 448.0, 632.0, 1047.0, 1566.0, 2565.0, 4295.0, 7225.0, 12532.0, 22700.0, 42685.0, 86629.0, 182185.0, 297433.0, 193571.0, 91024.0, 44556.0, 23743.0, 13207.0, 7759.0, 4530.0, 2745.0, 1704.0, 1027.0, 675.0, 426.0, 298.0, 180.0, 125.0, 78.0, 38.0, 29.0, 34.0, 21.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-28.375, -27.553466796875, -26.73193359375, -25.910400390625, -25.0888671875, -24.267333984375, -23.44580078125, -22.624267578125, -21.802734375, -20.981201171875, -20.15966796875, -19.338134765625, -18.5166015625, -17.695068359375, -16.87353515625, -16.052001953125, -15.23046875, -14.408935546875, -13.58740234375, -12.765869140625, -11.9443359375, -11.122802734375, -10.30126953125, -9.479736328125, -8.658203125, -7.836669921875, -7.01513671875, -6.193603515625, -5.3720703125, -4.550537109375, -3.72900390625, -2.907470703125, -2.0859375, -1.264404296875, -0.44287109375, 0.378662109375, 1.2001953125, 2.021728515625, 2.84326171875, 3.664794921875, 4.486328125, 5.307861328125, 6.12939453125, 6.950927734375, 7.7724609375, 8.593994140625, 9.41552734375, 10.237060546875, 11.05859375, 11.880126953125, 12.70166015625, 13.523193359375, 14.3447265625, 15.166259765625, 15.98779296875, 16.809326171875, 17.630859375, 18.452392578125, 19.27392578125, 20.095458984375, 20.9169921875, 21.738525390625, 22.56005859375, 23.381591796875, 24.203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 6.0, 11.0, 20.0, 12.0, 20.0, 15.0, 29.0, 21.0, 23.0, 28.0, 35.0, 44.0, 41.0, 49.0, 54.0, 51.0, 57.0, 50.0, 51.0, 49.0, 43.0, 42.0, 40.0, 40.0, 40.0, 21.0, 14.0, 17.0, 10.0, 13.0, 6.0, 9.0, 8.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.9375, -45.6298828125, -44.322265625, -43.0146484375, -41.70703125, -40.3994140625, -39.091796875, -37.7841796875, -36.4765625, -35.1689453125, -33.861328125, -32.5537109375, -31.24609375, -29.9384765625, -28.630859375, -27.3232421875, -26.015625, -24.7080078125, -23.400390625, -22.0927734375, -20.78515625, -19.4775390625, -18.169921875, -16.8623046875, -15.5546875, -14.2470703125, -12.939453125, -11.6318359375, -10.32421875, -9.0166015625, -7.708984375, -6.4013671875, -5.09375, -3.7861328125, -2.478515625, -1.1708984375, 0.13671875, 1.4443359375, 2.751953125, 4.0595703125, 5.3671875, 6.6748046875, 7.982421875, 9.2900390625, 10.59765625, 11.9052734375, 13.212890625, 14.5205078125, 15.828125, 17.1357421875, 18.443359375, 19.7509765625, 21.05859375, 22.3662109375, 23.673828125, 24.9814453125, 26.2890625, 27.5966796875, 28.904296875, 30.2119140625, 31.51953125, 32.8271484375, 34.134765625, 35.4423828125, 36.75]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 14.0, 15.0, 15.0, 24.0, 35.0, 47.0, 73.0, 117.0, 178.0, 289.0, 462.0, 669.0, 1086.0, 1746.0, 2724.0, 4756.0, 7998.0, 13618.0, 24344.0, 46730.0, 99934.0, 259997.0, 330142.0, 127810.0, 56989.0, 29092.0, 15981.0, 9347.0, 5484.0, 3316.0, 1995.0, 1311.0, 771.0, 468.0, 341.0, 235.0, 111.0, 100.0, 64.0, 41.0, 22.0, 19.0, 14.0, 7.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.6875, -32.56982421875, -31.4521484375, -30.33447265625, -29.216796875, -28.09912109375, -26.9814453125, -25.86376953125, -24.74609375, -23.62841796875, -22.5107421875, -21.39306640625, -20.275390625, -19.15771484375, -18.0400390625, -16.92236328125, -15.8046875, -14.68701171875, -13.5693359375, -12.45166015625, -11.333984375, -10.21630859375, -9.0986328125, -7.98095703125, -6.86328125, -5.74560546875, -4.6279296875, -3.51025390625, -2.392578125, -1.27490234375, -0.1572265625, 0.96044921875, 2.078125, 3.19580078125, 4.3134765625, 5.43115234375, 6.548828125, 7.66650390625, 8.7841796875, 9.90185546875, 11.01953125, 12.13720703125, 13.2548828125, 14.37255859375, 15.490234375, 16.60791015625, 17.7255859375, 18.84326171875, 19.9609375, 21.07861328125, 22.1962890625, 23.31396484375, 24.431640625, 25.54931640625, 26.6669921875, 27.78466796875, 28.90234375, 30.02001953125, 31.1376953125, 32.25537109375, 33.373046875, 34.49072265625, 35.6083984375, 36.72607421875, 37.84375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 8.0, 6.0, 6.0, 11.0, 15.0, 15.0, 16.0, 23.0, 20.0, 34.0, 28.0, 32.0, 36.0, 32.0, 39.0, 48.0, 41.0, 48.0, 51.0, 42.0, 58.0, 46.0, 35.0, 38.0, 33.0, 31.0, 22.0, 30.0, 26.0, 28.0, 18.0, 16.0, 16.0, 12.0, 16.0, 3.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.171875, -19.4619140625, -18.751953125, -18.0419921875, -17.33203125, -16.6220703125, -15.912109375, -15.2021484375, -14.4921875, -13.7822265625, -13.072265625, -12.3623046875, -11.65234375, -10.9423828125, -10.232421875, -9.5224609375, -8.8125, -8.1025390625, -7.392578125, -6.6826171875, -5.97265625, -5.2626953125, -4.552734375, -3.8427734375, -3.1328125, -2.4228515625, -1.712890625, -1.0029296875, -0.29296875, 0.4169921875, 1.126953125, 1.8369140625, 2.546875, 3.2568359375, 3.966796875, 4.6767578125, 5.38671875, 6.0966796875, 6.806640625, 7.5166015625, 8.2265625, 8.9365234375, 9.646484375, 10.3564453125, 11.06640625, 11.7763671875, 12.486328125, 13.1962890625, 13.90625, 14.6162109375, 15.326171875, 16.0361328125, 16.74609375, 17.4560546875, 18.166015625, 18.8759765625, 19.5859375, 20.2958984375, 21.005859375, 21.7158203125, 22.42578125, 23.1357421875, 23.845703125, 24.5556640625, 25.265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 12.0, 10.0, 16.0, 23.0, 40.0, 40.0, 76.0, 92.0, 131.0, 201.0, 278.0, 458.0, 586.0, 916.0, 1476.0, 2307.0, 3702.0, 6330.0, 11234.0, 20532.0, 40198.0, 82439.0, 173009.0, 296167.0, 206428.0, 98484.0, 47249.0, 24197.0, 13043.0, 7292.0, 4264.0, 2601.0, 1625.0, 1061.0, 642.0, 420.0, 303.0, 213.0, 136.0, 109.0, 50.0, 55.0, 31.0, 24.0, 13.0, 13.0, 9.0, 3.0, 2.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.77734375, -7.5389404296875, -7.300537109375, -7.0621337890625, -6.82373046875, -6.5853271484375, -6.346923828125, -6.1085205078125, -5.8701171875, -5.6317138671875, -5.393310546875, -5.1549072265625, -4.91650390625, -4.6781005859375, -4.439697265625, -4.2012939453125, -3.962890625, -3.7244873046875, -3.486083984375, -3.2476806640625, -3.00927734375, -2.7708740234375, -2.532470703125, -2.2940673828125, -2.0556640625, -1.8172607421875, -1.578857421875, -1.3404541015625, -1.10205078125, -0.8636474609375, -0.625244140625, -0.3868408203125, -0.1484375, 0.0899658203125, 0.328369140625, 0.5667724609375, 0.80517578125, 1.0435791015625, 1.281982421875, 1.5203857421875, 1.7587890625, 1.9971923828125, 2.235595703125, 2.4739990234375, 2.71240234375, 2.9508056640625, 3.189208984375, 3.4276123046875, 3.666015625, 3.9044189453125, 4.142822265625, 4.3812255859375, 4.61962890625, 4.8580322265625, 5.096435546875, 5.3348388671875, 5.5732421875, 5.8116455078125, 6.050048828125, 6.2884521484375, 6.52685546875, 6.7652587890625, 7.003662109375, 7.2420654296875, 7.48046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 11.0, 12.0, 11.0, 14.0, 19.0, 28.0, 30.0, 42.0, 41.0, 73.0, 73.0, 82.0, 90.0, 82.0, 61.0, 57.0, 46.0, 46.0, 41.0, 32.0, 29.0, 21.0, 20.0, 14.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010938644409179688, -0.001065678894519806, -0.001037493348121643, -0.0010093078017234802, -0.0009811222553253174, -0.0009529367089271545, -0.0009247511625289917, -0.0008965656161308289, -0.000868380069732666, -0.0008401945233345032, -0.0008120089769363403, -0.0007838234305381775, -0.0007556378841400146, -0.0007274523377418518, -0.000699266791343689, -0.0006710812449455261, -0.0006428956985473633, -0.0006147101521492004, -0.0005865246057510376, -0.0005583390593528748, -0.0005301535129547119, -0.0005019679665565491, -0.00047378242015838623, -0.0004455968737602234, -0.00041741132736206055, -0.0003892257809638977, -0.00036104023456573486, -0.000332854688167572, -0.0003046691417694092, -0.00027648359537124634, -0.0002482980489730835, -0.00022011250257492065, -0.0001919269561767578, -0.00016374140977859497, -0.00013555586338043213, -0.00010737031698226929, -7.918477058410645e-05, -5.0999224185943604e-05, -2.2813677787780762e-05, 5.37186861038208e-06, 3.355741500854492e-05, 6.174296140670776e-05, 8.99285078048706e-05, 0.00011811405420303345, 0.0001462996006011963, 0.00017448514699935913, 0.00020267069339752197, 0.00023085623979568481, 0.00025904178619384766, 0.0002872273325920105, 0.00031541287899017334, 0.0003435984253883362, 0.000371783971786499, 0.00039996951818466187, 0.0004281550645828247, 0.00045634061098098755, 0.0004845261573791504, 0.0005127117037773132, 0.0005408972501754761, 0.0005690827965736389, 0.0005972683429718018, 0.0006254538893699646, 0.0006536394357681274, 0.0006818249821662903, 0.0007100105285644531]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 14.0, 14.0, 23.0, 19.0, 45.0, 72.0, 89.0, 134.0, 161.0, 257.0, 382.0, 655.0, 1031.0, 1725.0, 2881.0, 5142.0, 9570.0, 18481.0, 37291.0, 78460.0, 166162.0, 288396.0, 223825.0, 108538.0, 51595.0, 24784.0, 12699.0, 6661.0, 3698.0, 2171.0, 1291.0, 786.0, 525.0, 333.0, 206.0, 136.0, 96.0, 52.0, 34.0, 38.0, 19.0, 18.0, 6.0, 15.0, 4.0, 3.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0], "bins": [-10.203125, -9.9005126953125, -9.597900390625, -9.2952880859375, -8.99267578125, -8.6900634765625, -8.387451171875, -8.0848388671875, -7.7822265625, -7.4796142578125, -7.177001953125, -6.8743896484375, -6.57177734375, -6.2691650390625, -5.966552734375, -5.6639404296875, -5.361328125, -5.0587158203125, -4.756103515625, -4.4534912109375, -4.15087890625, -3.8482666015625, -3.545654296875, -3.2430419921875, -2.9404296875, -2.6378173828125, -2.335205078125, -2.0325927734375, -1.72998046875, -1.4273681640625, -1.124755859375, -0.8221435546875, -0.51953125, -0.2169189453125, 0.085693359375, 0.3883056640625, 0.69091796875, 0.9935302734375, 1.296142578125, 1.5987548828125, 1.9013671875, 2.2039794921875, 2.506591796875, 2.8092041015625, 3.11181640625, 3.4144287109375, 3.717041015625, 4.0196533203125, 4.322265625, 4.6248779296875, 4.927490234375, 5.2301025390625, 5.53271484375, 5.8353271484375, 6.137939453125, 6.4405517578125, 6.7431640625, 7.0457763671875, 7.348388671875, 7.6510009765625, 7.95361328125, 8.2562255859375, 8.558837890625, 8.8614501953125, 9.1640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 12.0, 10.0, 10.0, 16.0, 14.0, 27.0, 26.0, 31.0, 42.0, 58.0, 62.0, 80.0, 61.0, 76.0, 76.0, 66.0, 69.0, 48.0, 35.0, 37.0, 21.0, 18.0, 18.0, 15.0, 10.0, 7.0, 5.0, 12.0, 4.0, 5.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9453125, -2.859100341796875, -2.77288818359375, -2.686676025390625, -2.6004638671875, -2.514251708984375, -2.42803955078125, -2.341827392578125, -2.255615234375, -2.169403076171875, -2.08319091796875, -1.996978759765625, -1.9107666015625, -1.824554443359375, -1.73834228515625, -1.652130126953125, -1.56591796875, -1.479705810546875, -1.39349365234375, -1.307281494140625, -1.2210693359375, -1.134857177734375, -1.04864501953125, -0.962432861328125, -0.876220703125, -0.790008544921875, -0.70379638671875, -0.617584228515625, -0.5313720703125, -0.445159912109375, -0.35894775390625, -0.272735595703125, -0.1865234375, -0.100311279296875, -0.01409912109375, 0.072113037109375, 0.1583251953125, 0.244537353515625, 0.33074951171875, 0.416961669921875, 0.503173828125, 0.589385986328125, 0.67559814453125, 0.761810302734375, 0.8480224609375, 0.934234619140625, 1.02044677734375, 1.106658935546875, 1.19287109375, 1.279083251953125, 1.36529541015625, 1.451507568359375, 1.5377197265625, 1.623931884765625, 1.71014404296875, 1.796356201171875, 1.882568359375, 1.968780517578125, 2.05499267578125, 2.141204833984375, 2.2274169921875, 2.313629150390625, 2.39984130859375, 2.486053466796875, 2.572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 17.0, 14.0, 25.0, 30.0, 45.0, 44.0, 64.0, 61.0, 60.0, 75.0, 83.0, 80.0, 67.0, 57.0, 61.0, 44.0, 27.0, 28.0, 20.0, 16.0, 16.0, 12.0, 6.0, 8.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.283668518066406, -45.869693756103516, -44.455718994140625, -43.04174041748047, -41.62776565551758, -40.21379089355469, -38.79981231689453, -37.38583755493164, -35.97186279296875, -34.55788803100586, -33.14391326904297, -31.729934692382812, -30.315959930419922, -28.90198516845703, -27.488008499145508, -26.074031829833984, -24.660057067871094, -23.246082305908203, -21.83210563659668, -20.418128967285156, -19.004154205322266, -17.590179443359375, -16.17620277404785, -14.762227058410645, -13.348251342773438, -11.93427562713623, -10.520299911499023, -9.106324195861816, -7.692348480224609, -6.278372764587402, -4.864397048950195, -3.4504213333129883, -2.0364456176757812, -0.6224699020385742, 0.7915058135986328, 2.20548152923584, 3.619457244873047, 5.033432960510254, 6.447408676147461, 7.861384391784668, 9.275360107421875, 10.689335823059082, 12.103311538696289, 13.517287254333496, 14.931262969970703, 16.345237731933594, 17.759214401245117, 19.17319107055664, 20.58716583251953, 22.001140594482422, 23.415117263793945, 24.82909393310547, 26.24306869506836, 27.65704345703125, 29.071020126342773, 30.484996795654297, 31.898971557617188, 33.31294631958008, 34.72692108154297, 36.140899658203125, 37.554874420166016, 38.968849182128906, 40.38282775878906, 41.79680252075195, 43.210777282714844]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 14.0, 8.0, 12.0, 13.0, 14.0, 14.0, 26.0, 19.0, 28.0, 31.0, 20.0, 28.0, 31.0, 43.0, 47.0, 42.0, 49.0, 50.0, 43.0, 48.0, 43.0, 48.0, 52.0, 34.0, 41.0, 42.0, 28.0, 23.0, 22.0, 16.0, 10.0, 10.0, 8.0, 14.0, 11.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.58190155029297, -41.38736343383789, -40.19282531738281, -38.998291015625, -37.80375289916992, -36.609214782714844, -35.41468048095703, -34.22014236450195, -33.025604248046875, -31.831066131591797, -30.63652992248535, -29.441993713378906, -28.247455596923828, -27.05291748046875, -25.858381271362305, -24.66384506225586, -23.46930694580078, -22.274768829345703, -21.080232620239258, -19.885696411132812, -18.691158294677734, -17.496620178222656, -16.30208396911621, -15.10754680633545, -13.913009643554688, -12.718472480773926, -11.523935317993164, -10.329398155212402, -9.13486099243164, -7.940323829650879, -6.745786666870117, -5.5512495040893555, -4.356708526611328, -3.1621713638305664, -1.9676342010498047, -0.773097038269043, 0.42144012451171875, 1.6159772872924805, 2.810514450073242, 4.005051612854004, 5.199588775634766, 6.394125938415527, 7.588663101196289, 8.78320026397705, 9.977737426757812, 11.172274589538574, 12.366811752319336, 13.561348915100098, 14.75588607788086, 15.950423240661621, 17.144960403442383, 18.339496612548828, 19.534034729003906, 20.728572845458984, 21.92310905456543, 23.117645263671875, 24.312183380126953, 25.50672149658203, 26.701257705688477, 27.895793914794922, 29.09033203125, 30.284870147705078, 31.479406356811523, 32.67394256591797, 33.86848068237305]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 7.0, 23.0, 37.0, 34.0, 59.0, 95.0, 154.0, 230.0, 341.0, 556.0, 829.0, 1411.0, 2186.0, 3465.0, 5566.0, 8891.0, 14905.0, 23717.0, 38754.0, 63073.0, 101748.0, 157298.0, 198170.0, 158873.0, 102970.0, 63138.0, 38982.0, 24053.0, 14761.0, 8999.0, 5566.0, 3528.0, 2278.0, 1406.0, 875.0, 580.0, 340.0, 237.0, 157.0, 80.0, 54.0, 48.0, 17.0, 22.0, 13.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-38.96875, -37.73193359375, -36.4951171875, -35.25830078125, -34.021484375, -32.78466796875, -31.5478515625, -30.31103515625, -29.07421875, -27.83740234375, -26.6005859375, -25.36376953125, -24.126953125, -22.89013671875, -21.6533203125, -20.41650390625, -19.1796875, -17.94287109375, -16.7060546875, -15.46923828125, -14.232421875, -12.99560546875, -11.7587890625, -10.52197265625, -9.28515625, -8.04833984375, -6.8115234375, -5.57470703125, -4.337890625, -3.10107421875, -1.8642578125, -0.62744140625, 0.609375, 1.84619140625, 3.0830078125, 4.31982421875, 5.556640625, 6.79345703125, 8.0302734375, 9.26708984375, 10.50390625, 11.74072265625, 12.9775390625, 14.21435546875, 15.451171875, 16.68798828125, 17.9248046875, 19.16162109375, 20.3984375, 21.63525390625, 22.8720703125, 24.10888671875, 25.345703125, 26.58251953125, 27.8193359375, 29.05615234375, 30.29296875, 31.52978515625, 32.7666015625, 34.00341796875, 35.240234375, 36.47705078125, 37.7138671875, 38.95068359375, 40.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 1.0, 7.0, 6.0, 9.0, 13.0, 14.0, 8.0, 15.0, 19.0, 26.0, 19.0, 25.0, 20.0, 32.0, 37.0, 30.0, 49.0, 55.0, 49.0, 52.0, 49.0, 49.0, 50.0, 60.0, 47.0, 34.0, 45.0, 39.0, 31.0, 27.0, 13.0, 13.0, 11.0, 11.0, 10.0, 7.0, 7.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.21875, -42.01171875, -40.8046875, -39.59765625, -38.390625, -37.18359375, -35.9765625, -34.76953125, -33.5625, -32.35546875, -31.1484375, -29.94140625, -28.734375, -27.52734375, -26.3203125, -25.11328125, -23.90625, -22.69921875, -21.4921875, -20.28515625, -19.078125, -17.87109375, -16.6640625, -15.45703125, -14.25, -13.04296875, -11.8359375, -10.62890625, -9.421875, -8.21484375, -7.0078125, -5.80078125, -4.59375, -3.38671875, -2.1796875, -0.97265625, 0.234375, 1.44140625, 2.6484375, 3.85546875, 5.0625, 6.26953125, 7.4765625, 8.68359375, 9.890625, 11.09765625, 12.3046875, 13.51171875, 14.71875, 15.92578125, 17.1328125, 18.33984375, 19.546875, 20.75390625, 21.9609375, 23.16796875, 24.375, 25.58203125, 26.7890625, 27.99609375, 29.203125, 30.41015625, 31.6171875, 32.82421875, 34.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 10.0, 13.0, 25.0, 22.0, 31.0, 44.0, 88.0, 124.0, 192.0, 256.0, 409.0, 633.0, 920.0, 1411.0, 2037.0, 3102.0, 4774.0, 7116.0, 10917.0, 16508.0, 25070.0, 38595.0, 58686.0, 88533.0, 129064.0, 166779.0, 155948.0, 114212.0, 76289.0, 50302.0, 33135.0, 21554.0, 14195.0, 9385.0, 6187.0, 4055.0, 2674.0, 1727.0, 1195.0, 780.0, 499.0, 343.0, 237.0, 144.0, 111.0, 79.0, 48.0, 36.0, 25.0, 11.0, 11.0, 11.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.25, -34.02685546875, -32.8037109375, -31.58056640625, -30.357421875, -29.13427734375, -27.9111328125, -26.68798828125, -25.46484375, -24.24169921875, -23.0185546875, -21.79541015625, -20.572265625, -19.34912109375, -18.1259765625, -16.90283203125, -15.6796875, -14.45654296875, -13.2333984375, -12.01025390625, -10.787109375, -9.56396484375, -8.3408203125, -7.11767578125, -5.89453125, -4.67138671875, -3.4482421875, -2.22509765625, -1.001953125, 0.22119140625, 1.4443359375, 2.66748046875, 3.890625, 5.11376953125, 6.3369140625, 7.56005859375, 8.783203125, 10.00634765625, 11.2294921875, 12.45263671875, 13.67578125, 14.89892578125, 16.1220703125, 17.34521484375, 18.568359375, 19.79150390625, 21.0146484375, 22.23779296875, 23.4609375, 24.68408203125, 25.9072265625, 27.13037109375, 28.353515625, 29.57666015625, 30.7998046875, 32.02294921875, 33.24609375, 34.46923828125, 35.6923828125, 36.91552734375, 38.138671875, 39.36181640625, 40.5849609375, 41.80810546875, 43.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 14.0, 10.0, 8.0, 11.0, 8.0, 15.0, 22.0, 19.0, 11.0, 27.0, 24.0, 23.0, 29.0, 39.0, 31.0, 37.0, 24.0, 37.0, 26.0, 43.0, 42.0, 38.0, 32.0, 36.0, 34.0, 47.0, 30.0, 26.0, 37.0, 22.0, 28.0, 20.0, 20.0, 18.0, 23.0, 14.0, 16.0, 7.0, 12.0, 8.0, 9.0, 2.0, 4.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.709228515625, -18.05908203125, -17.408935546875, -16.7587890625, -16.108642578125, -15.45849609375, -14.808349609375, -14.158203125, -13.508056640625, -12.85791015625, -12.207763671875, -11.5576171875, -10.907470703125, -10.25732421875, -9.607177734375, -8.95703125, -8.306884765625, -7.65673828125, -7.006591796875, -6.3564453125, -5.706298828125, -5.05615234375, -4.406005859375, -3.755859375, -3.105712890625, -2.45556640625, -1.805419921875, -1.1552734375, -0.505126953125, 0.14501953125, 0.795166015625, 1.4453125, 2.095458984375, 2.74560546875, 3.395751953125, 4.0458984375, 4.696044921875, 5.34619140625, 5.996337890625, 6.646484375, 7.296630859375, 7.94677734375, 8.596923828125, 9.2470703125, 9.897216796875, 10.54736328125, 11.197509765625, 11.84765625, 12.497802734375, 13.14794921875, 13.798095703125, 14.4482421875, 15.098388671875, 15.74853515625, 16.398681640625, 17.048828125, 17.698974609375, 18.34912109375, 18.999267578125, 19.6494140625, 20.299560546875, 20.94970703125, 21.599853515625, 22.25]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 14.0, 34.0, 35.0, 64.0, 65.0, 83.0, 159.0, 243.0, 344.0, 506.0, 822.0, 1317.0, 2163.0, 3585.0, 6398.0, 11480.0, 21717.0, 42286.0, 87756.0, 184611.0, 287426.0, 200708.0, 97234.0, 46716.0, 23570.0, 12483.0, 6785.0, 3790.0, 2283.0, 1388.0, 841.0, 535.0, 342.0, 255.0, 173.0, 99.0, 69.0, 52.0, 43.0, 21.0, 8.0, 9.0, 15.0, 4.0, 4.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-24.78125, -24.020263671875, -23.25927734375, -22.498291015625, -21.7373046875, -20.976318359375, -20.21533203125, -19.454345703125, -18.693359375, -17.932373046875, -17.17138671875, -16.410400390625, -15.6494140625, -14.888427734375, -14.12744140625, -13.366455078125, -12.60546875, -11.844482421875, -11.08349609375, -10.322509765625, -9.5615234375, -8.800537109375, -8.03955078125, -7.278564453125, -6.517578125, -5.756591796875, -4.99560546875, -4.234619140625, -3.4736328125, -2.712646484375, -1.95166015625, -1.190673828125, -0.4296875, 0.331298828125, 1.09228515625, 1.853271484375, 2.6142578125, 3.375244140625, 4.13623046875, 4.897216796875, 5.658203125, 6.419189453125, 7.18017578125, 7.941162109375, 8.7021484375, 9.463134765625, 10.22412109375, 10.985107421875, 11.74609375, 12.507080078125, 13.26806640625, 14.029052734375, 14.7900390625, 15.551025390625, 16.31201171875, 17.072998046875, 17.833984375, 18.594970703125, 19.35595703125, 20.116943359375, 20.8779296875, 21.638916015625, 22.39990234375, 23.160888671875, 23.921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 9.0, 13.0, 8.0, 18.0, 23.0, 34.0, 33.0, 45.0, 54.0, 72.0, 81.0, 94.0, 117.0, 83.0, 72.0, 59.0, 52.0, 34.0, 22.0, 15.0, 16.0, 6.0, 10.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028076171875, -0.0027250945568084717, -0.0026425719261169434, -0.002560049295425415, -0.0024775266647338867, -0.0023950040340423584, -0.00231248140335083, -0.0022299587726593018, -0.0021474361419677734, -0.002064913511276245, -0.001982390880584717, -0.0018998682498931885, -0.0018173456192016602, -0.0017348229885101318, -0.0016523003578186035, -0.0015697777271270752, -0.0014872550964355469, -0.0014047324657440186, -0.0013222098350524902, -0.001239687204360962, -0.0011571645736694336, -0.0010746419429779053, -0.000992119312286377, -0.0009095966815948486, -0.0008270740509033203, -0.000744551420211792, -0.0006620287895202637, -0.0005795061588287354, -0.000496983528137207, -0.0004144608974456787, -0.0003319382667541504, -0.00024941563606262207, -0.00016689300537109375, -8.437037467956543e-05, -1.8477439880371094e-06, 8.067488670349121e-05, 0.00016319751739501953, 0.00024572014808654785, 0.00032824277877807617, 0.0004107654094696045, 0.0004932880401611328, 0.0005758106708526611, 0.0006583333015441895, 0.0007408559322357178, 0.0008233785629272461, 0.0009059011936187744, 0.0009884238243103027, 0.001070946455001831, 0.0011534690856933594, 0.0012359917163848877, 0.001318514347076416, 0.0014010369777679443, 0.0014835596084594727, 0.001566082239151001, 0.0016486048698425293, 0.0017311275005340576, 0.001813650131225586, 0.0018961727619171143, 0.0019786953926086426, 0.002061218023300171, 0.0021437406539916992, 0.0022262632846832275, 0.002308785915374756, 0.002391308546066284, 0.0024738311767578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 4.0, 5.0, 5.0, 18.0, 26.0, 31.0, 41.0, 79.0, 73.0, 150.0, 200.0, 346.0, 512.0, 855.0, 1462.0, 2249.0, 3954.0, 6690.0, 11593.0, 21262.0, 39563.0, 74866.0, 141246.0, 237694.0, 224822.0, 130174.0, 68629.0, 36377.0, 19419.0, 10850.0, 6092.0, 3548.0, 2132.0, 1308.0, 795.0, 520.0, 339.0, 195.0, 137.0, 86.0, 56.0, 53.0, 28.0, 17.0, 17.0, 7.0, 8.0, 3.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.25, -20.56298828125, -19.8759765625, -19.18896484375, -18.501953125, -17.81494140625, -17.1279296875, -16.44091796875, -15.75390625, -15.06689453125, -14.3798828125, -13.69287109375, -13.005859375, -12.31884765625, -11.6318359375, -10.94482421875, -10.2578125, -9.57080078125, -8.8837890625, -8.19677734375, -7.509765625, -6.82275390625, -6.1357421875, -5.44873046875, -4.76171875, -4.07470703125, -3.3876953125, -2.70068359375, -2.013671875, -1.32666015625, -0.6396484375, 0.04736328125, 0.734375, 1.42138671875, 2.1083984375, 2.79541015625, 3.482421875, 4.16943359375, 4.8564453125, 5.54345703125, 6.23046875, 6.91748046875, 7.6044921875, 8.29150390625, 8.978515625, 9.66552734375, 10.3525390625, 11.03955078125, 11.7265625, 12.41357421875, 13.1005859375, 13.78759765625, 14.474609375, 15.16162109375, 15.8486328125, 16.53564453125, 17.22265625, 17.90966796875, 18.5966796875, 19.28369140625, 19.970703125, 20.65771484375, 21.3447265625, 22.03173828125, 22.71875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 4.0, 4.0, 8.0, 13.0, 14.0, 17.0, 17.0, 33.0, 34.0, 33.0, 40.0, 39.0, 48.0, 47.0, 50.0, 66.0, 52.0, 68.0, 64.0, 52.0, 47.0, 37.0, 32.0, 25.0, 31.0, 31.0, 11.0, 21.0, 12.0, 10.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.46728515625, -7.2509765625, -7.03466796875, -6.818359375, -6.60205078125, -6.3857421875, -6.16943359375, -5.953125, -5.73681640625, -5.5205078125, -5.30419921875, -5.087890625, -4.87158203125, -4.6552734375, -4.43896484375, -4.22265625, -4.00634765625, -3.7900390625, -3.57373046875, -3.357421875, -3.14111328125, -2.9248046875, -2.70849609375, -2.4921875, -2.27587890625, -2.0595703125, -1.84326171875, -1.626953125, -1.41064453125, -1.1943359375, -0.97802734375, -0.76171875, -0.54541015625, -0.3291015625, -0.11279296875, 0.103515625, 0.31982421875, 0.5361328125, 0.75244140625, 0.96875, 1.18505859375, 1.4013671875, 1.61767578125, 1.833984375, 2.05029296875, 2.2666015625, 2.48291015625, 2.69921875, 2.91552734375, 3.1318359375, 3.34814453125, 3.564453125, 3.78076171875, 3.9970703125, 4.21337890625, 4.4296875, 4.64599609375, 4.8623046875, 5.07861328125, 5.294921875, 5.51123046875, 5.7275390625, 5.94384765625, 6.16015625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 9.0, 9.0, 15.0, 19.0, 15.0, 22.0, 25.0, 32.0, 50.0, 40.0, 56.0, 58.0, 68.0, 58.0, 57.0, 62.0, 64.0, 59.0, 37.0, 40.0, 47.0, 17.0, 21.0, 22.0, 20.0, 15.0, 12.0, 7.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.43230438232422, -41.18538284301758, -39.93846130371094, -38.6915397644043, -37.444618225097656, -36.197696685791016, -34.950775146484375, -33.703853607177734, -32.456932067871094, -31.210010528564453, -29.963088989257812, -28.716167449951172, -27.46924591064453, -26.22232437133789, -24.97540283203125, -23.72848129272461, -22.481557846069336, -21.234636306762695, -19.987714767456055, -18.740793228149414, -17.493871688842773, -16.246950149536133, -15.000027656555176, -13.753106117248535, -12.506184577941895, -11.259263038635254, -10.012341499328613, -8.765419006347656, -7.518497943878174, -6.271576404571533, -5.024654388427734, -3.7777328491210938, -2.530811309814453, -1.283889651298523, -0.03696799278259277, 1.209953784942627, 2.4568753242492676, 3.703796863555908, 4.950718879699707, 6.197640419006348, 7.444561958312988, 8.691483497619629, 9.93840503692627, 11.185327529907227, 12.432249069213867, 13.679170608520508, 14.926092147827148, 16.17301368713379, 17.41993522644043, 18.66685676574707, 19.91377830505371, 21.16069984436035, 22.407621383666992, 23.654542922973633, 24.901466369628906, 26.148387908935547, 27.395309448242188, 28.642230987548828, 29.88915252685547, 31.13607406616211, 32.38299560546875, 33.62991714477539, 34.87683868408203, 36.12376022338867, 37.37068176269531]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 6.0, 10.0, 9.0, 13.0, 9.0, 13.0, 19.0, 25.0, 22.0, 30.0, 34.0, 34.0, 31.0, 47.0, 32.0, 52.0, 43.0, 44.0, 44.0, 39.0, 52.0, 42.0, 42.0, 47.0, 44.0, 38.0, 28.0, 26.0, 19.0, 23.0, 16.0, 14.0, 12.0, 14.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.439571380615234, -45.023658752441406, -43.607749938964844, -42.191837310791016, -40.77592468261719, -39.360015869140625, -37.9441032409668, -36.52819061279297, -35.112281799316406, -33.69636917114258, -32.280460357666016, -30.864547729492188, -29.448637008666992, -28.032726287841797, -26.61681365966797, -25.200902938842773, -23.784992218017578, -22.369081497192383, -20.953170776367188, -19.53725814819336, -18.121347427368164, -16.70543670654297, -15.289525032043457, -13.873613357543945, -12.45770263671875, -11.041791915893555, -9.625880241394043, -8.209968566894531, -6.794057846069336, -5.378146648406982, -3.962235450744629, -2.546323776245117, -1.1304092407226562, 0.28550195693969727, 1.7014131546020508, 3.1173243522644043, 4.533235549926758, 5.949146747589111, 7.365057945251465, 8.780969619750977, 10.196880340576172, 11.612791061401367, 13.028702735900879, 14.44461441040039, 15.860525131225586, 17.27643585205078, 18.69234848022461, 20.108259201049805, 21.524169921875, 22.940080642700195, 24.35599136352539, 25.77190399169922, 27.187814712524414, 28.60372543334961, 30.019638061523438, 31.435548782348633, 32.85145950317383, 34.267372131347656, 35.68328094482422, 37.09919357299805, 38.515106201171875, 39.93101501464844, 41.346927642822266, 42.762840270996094, 44.178749084472656]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 11.0, 8.0, 14.0, 17.0, 17.0, 21.0, 32.0, 45.0, 56.0, 64.0, 85.0, 127.0, 163.0, 233.0, 304.0, 419.0, 671.0, 874.0, 1043125.0, 1167.0, 856.0, 648.0, 462.0, 319.0, 198.0, 166.0, 129.0, 78.0, 62.0, 51.0, 48.0, 27.0, 26.0, 20.0, 8.0, 11.0, 11.0, 7.0, 7.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-885.319091796875, -860.0007934570312, -834.6824951171875, -809.3641967773438, -784.0458984375, -758.7276000976562, -733.4093017578125, -708.0910034179688, -682.772705078125, -657.4544067382812, -632.1361083984375, -606.8178100585938, -581.49951171875, -556.1812133789062, -530.8629150390625, -505.54461669921875, -480.2263488769531, -454.9080505371094, -429.5897521972656, -404.2714538574219, -378.9531555175781, -353.6348571777344, -328.31658935546875, -302.998291015625, -277.67999267578125, -252.3616943359375, -227.04339599609375, -201.72509765625, -176.40679931640625, -151.0885009765625, -125.77021789550781, -100.45191955566406, -75.13360595703125, -49.8153076171875, -24.497013092041016, 0.8212814331054688, 26.13957977294922, 51.45787811279297, 76.77616882324219, 102.09446716308594, 127.41276550292969, 152.73106384277344, 178.0493621826172, 203.36764526367188, 228.68594360351562, 254.00424194335938, 279.3225402832031, 304.6408386230469, 329.9591369628906, 355.2774353027344, 380.5957336425781, 405.9140319824219, 431.2323303222656, 456.5506286621094, 481.868896484375, 507.18719482421875, 532.5054931640625, 557.8237915039062, 583.14208984375, 608.4603881835938, 633.7786865234375, 659.0969848632812, 684.415283203125, 709.7335815429688, 735.0518798828125]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 10.0, 9.0, 14.0, 18.0, 23.0, 26.0, 23.0, 23.0, 39.0, 52.0, 62.0, 81.0, 110.0, 130.0, 168.0, 238.0, 413.0, 1584.0, 51458464.0, 7699.0, 902.0, 325.0, 202.0, 149.0, 115.0, 95.0, 74.0, 60.0, 47.0, 29.0, 26.0, 22.0, 22.0, 14.0, 16.0, 12.0, 14.0, 8.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3355.04296875, -3238.647705078125, -3122.25244140625, -3005.857177734375, -2889.4619140625, -2773.066650390625, -2656.67138671875, -2540.276123046875, -2423.880859375, -2307.485595703125, -2191.09033203125, -2074.695068359375, -1958.2998046875, -1841.904541015625, -1725.50927734375, -1609.114013671875, -1492.71875, -1376.323486328125, -1259.92822265625, -1143.532958984375, -1027.1376953125, -910.742431640625, -794.34716796875, -677.951904296875, -561.556640625, -445.161376953125, -328.76611328125, -212.370849609375, -95.9755859375, 20.419677734375, 136.81494140625, 253.210205078125, 369.605712890625, 486.0009765625, 602.396240234375, 718.79150390625, 835.186767578125, 951.58203125, 1067.977294921875, 1184.37255859375, 1300.767822265625, 1417.1630859375, 1533.558349609375, 1649.95361328125, 1766.348876953125, 1882.744140625, 1999.139404296875, 2115.53466796875, 2231.929931640625, 2348.3251953125, 2464.720458984375, 2581.11572265625, 2697.510986328125, 2813.90625, 2930.301513671875, 3046.69677734375, 3163.092041015625, 3279.4873046875, 3395.882568359375, 3512.27783203125, 3628.673095703125, 3745.068359375, 3861.463623046875, 3977.85888671875, 4094.254150390625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 9.0, 13.0, 13.0, 21.0, 54.0, 67.0, 111.0, 205.0, 375.0, 647.0, 1167.0, 2128.0, 3966.0, 8101.0, 16808.0, 35378.0, 79686.0, 192082.0, 522875.0, 1990817.0, 2437926.0, 612143.0, 218663.0, 90331.0, 40360.0, 18642.0, 9076.0, 4563.0, 2370.0, 1208.0, 698.0, 373.0, 208.0, 122.0, 84.0, 54.0, 36.0, 18.0, 21.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-162.375, -157.8740234375, -153.373046875, -148.8720703125, -144.37109375, -139.8701171875, -135.369140625, -130.8681640625, -126.3671875, -121.8662109375, -117.365234375, -112.8642578125, -108.36328125, -103.8623046875, -99.361328125, -94.8603515625, -90.359375, -85.8583984375, -81.357421875, -76.8564453125, -72.35546875, -67.8544921875, -63.353515625, -58.8525390625, -54.3515625, -49.8505859375, -45.349609375, -40.8486328125, -36.34765625, -31.8466796875, -27.345703125, -22.8447265625, -18.34375, -13.8427734375, -9.341796875, -4.8408203125, -0.33984375, 4.1611328125, 8.662109375, 13.1630859375, 17.6640625, 22.1650390625, 26.666015625, 31.1669921875, 35.66796875, 40.1689453125, 44.669921875, 49.1708984375, 53.671875, 58.1728515625, 62.673828125, 67.1748046875, 71.67578125, 76.1767578125, 80.677734375, 85.1787109375, 89.6796875, 94.1806640625, 98.681640625, 103.1826171875, 107.68359375, 112.1845703125, 116.685546875, 121.1865234375, 125.6875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 2.0, 6.0, 9.0, 15.0, 13.0, 13.0, 15.0, 18.0, 18.0, 18.0, 34.0, 40.0, 39.0, 50.0, 72.0, 97.0, 120.0, 162.0, 181.0, 212.0, 161.0, 155.0, 112.0, 93.0, 60.0, 43.0, 45.0, 33.0, 30.0, 31.0, 21.0, 14.0, 8.0, 14.0, 13.0, 8.0, 6.0, 12.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.4375, -61.3486328125, -59.259765625, -57.1708984375, -55.08203125, -52.9931640625, -50.904296875, -48.8154296875, -46.7265625, -44.6376953125, -42.548828125, -40.4599609375, -38.37109375, -36.2822265625, -34.193359375, -32.1044921875, -30.015625, -27.9267578125, -25.837890625, -23.7490234375, -21.66015625, -19.5712890625, -17.482421875, -15.3935546875, -13.3046875, -11.2158203125, -9.126953125, -7.0380859375, -4.94921875, -2.8603515625, -0.771484375, 1.3173828125, 3.40625, 5.4951171875, 7.583984375, 9.6728515625, 11.76171875, 13.8505859375, 15.939453125, 18.0283203125, 20.1171875, 22.2060546875, 24.294921875, 26.3837890625, 28.47265625, 30.5615234375, 32.650390625, 34.7392578125, 36.828125, 38.9169921875, 41.005859375, 43.0947265625, 45.18359375, 47.2724609375, 49.361328125, 51.4501953125, 53.5390625, 55.6279296875, 57.716796875, 59.8056640625, 61.89453125, 63.9833984375, 66.072265625, 68.1611328125, 70.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 18.0, 27.0, 35.0, 36.0, 74.0, 110.0, 157.0, 238.0, 369.0, 557.0, 898.0, 1498.0, 2437.0, 3794.0, 6321.0, 10177.0, 16228.0, 26613.0, 43788.0, 72166.0, 120200.0, 200852.0, 347439.0, 711819.0, 2035070.0, 1444843.0, 536120.0, 285309.0, 168284.0, 100737.0, 60792.0, 36631.0, 22215.0, 13433.0, 8353.0, 4993.0, 3238.0, 2070.0, 1222.0, 783.0, 517.0, 321.0, 214.0, 144.0, 96.0, 43.0, 35.0, 40.0, 21.0, 25.0, 8.0, 13.0, 7.0, 0.0, 1.0, 2.0, 3.0], "bins": [-54.03125, -52.33349609375, -50.6357421875, -48.93798828125, -47.240234375, -45.54248046875, -43.8447265625, -42.14697265625, -40.44921875, -38.75146484375, -37.0537109375, -35.35595703125, -33.658203125, -31.96044921875, -30.2626953125, -28.56494140625, -26.8671875, -25.16943359375, -23.4716796875, -21.77392578125, -20.076171875, -18.37841796875, -16.6806640625, -14.98291015625, -13.28515625, -11.58740234375, -9.8896484375, -8.19189453125, -6.494140625, -4.79638671875, -3.0986328125, -1.40087890625, 0.296875, 1.99462890625, 3.6923828125, 5.39013671875, 7.087890625, 8.78564453125, 10.4833984375, 12.18115234375, 13.87890625, 15.57666015625, 17.2744140625, 18.97216796875, 20.669921875, 22.36767578125, 24.0654296875, 25.76318359375, 27.4609375, 29.15869140625, 30.8564453125, 32.55419921875, 34.251953125, 35.94970703125, 37.6474609375, 39.34521484375, 41.04296875, 42.74072265625, 44.4384765625, 46.13623046875, 47.833984375, 49.53173828125, 51.2294921875, 52.92724609375, 54.625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 6.0, 9.0, 11.0, 9.0, 15.0, 17.0, 35.0, 21.0, 32.0, 39.0, 41.0, 42.0, 55.0, 82.0, 120.0, 191.0, 265.0, 291.0, 219.0, 110.0, 75.0, 52.0, 55.0, 38.0, 29.0, 26.0, 23.0, 21.0, 17.0, 8.0, 8.0, 16.0, 6.0, 8.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.375, -77.4052734375, -74.435546875, -71.4658203125, -68.49609375, -65.5263671875, -62.556640625, -59.5869140625, -56.6171875, -53.6474609375, -50.677734375, -47.7080078125, -44.73828125, -41.7685546875, -38.798828125, -35.8291015625, -32.859375, -29.8896484375, -26.919921875, -23.9501953125, -20.98046875, -18.0107421875, -15.041015625, -12.0712890625, -9.1015625, -6.1318359375, -3.162109375, -0.1923828125, 2.77734375, 5.7470703125, 8.716796875, 11.6865234375, 14.65625, 17.6259765625, 20.595703125, 23.5654296875, 26.53515625, 29.5048828125, 32.474609375, 35.4443359375, 38.4140625, 41.3837890625, 44.353515625, 47.3232421875, 50.29296875, 53.2626953125, 56.232421875, 59.2021484375, 62.171875, 65.1416015625, 68.111328125, 71.0810546875, 74.05078125, 77.0205078125, 79.990234375, 82.9599609375, 85.9296875, 88.8994140625, 91.869140625, 94.8388671875, 97.80859375, 100.7783203125, 103.748046875, 106.7177734375, 109.6875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 10.0, 8.0, 25.0, 43.0, 56.0, 93.0, 102.0, 135.0, 228.0, 310.0, 446.0, 625.0, 887.0, 1264.0, 1819.0, 2545.0, 3713.0, 5343.0, 7789.0, 11437.0, 17611.0, 27081.0, 43863.0, 75192.0, 176320.0, 5419130.0, 271450.0, 85783.0, 48318.0, 29903.0, 19478.0, 12715.0, 8397.0, 5788.0, 4074.0, 2810.0, 1894.0, 1403.0, 997.0, 707.0, 525.0, 335.0, 256.0, 175.0, 111.0, 85.0, 61.0, 44.0, 17.0, 16.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.5625, -97.1669921875, -93.771484375, -90.3759765625, -86.98046875, -83.5849609375, -80.189453125, -76.7939453125, -73.3984375, -70.0029296875, -66.607421875, -63.2119140625, -59.81640625, -56.4208984375, -53.025390625, -49.6298828125, -46.234375, -42.8388671875, -39.443359375, -36.0478515625, -32.65234375, -29.2568359375, -25.861328125, -22.4658203125, -19.0703125, -15.6748046875, -12.279296875, -8.8837890625, -5.48828125, -2.0927734375, 1.302734375, 4.6982421875, 8.09375, 11.4892578125, 14.884765625, 18.2802734375, 21.67578125, 25.0712890625, 28.466796875, 31.8623046875, 35.2578125, 38.6533203125, 42.048828125, 45.4443359375, 48.83984375, 52.2353515625, 55.630859375, 59.0263671875, 62.421875, 65.8173828125, 69.212890625, 72.6083984375, 76.00390625, 79.3994140625, 82.794921875, 86.1904296875, 89.5859375, 92.9814453125, 96.376953125, 99.7724609375, 103.16796875, 106.5634765625, 109.958984375, 113.3544921875, 116.75]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 13.0, 12.0, 12.0, 10.0, 18.0, 15.0, 19.0, 25.0, 29.0, 19.0, 40.0, 29.0, 33.0, 43.0, 52.0, 77.0, 152.0, 281.0, 404.0, 205.0, 97.0, 71.0, 36.0, 40.0, 36.0, 23.0, 31.0, 33.0, 20.0, 21.0, 14.0, 15.0, 12.0, 11.0, 14.0, 13.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-147.375, -142.685546875, -137.99609375, -133.306640625, -128.6171875, -123.927734375, -119.23828125, -114.548828125, -109.859375, -105.169921875, -100.48046875, -95.791015625, -91.1015625, -86.412109375, -81.72265625, -77.033203125, -72.34375, -67.654296875, -62.96484375, -58.275390625, -53.5859375, -48.896484375, -44.20703125, -39.517578125, -34.828125, -30.138671875, -25.44921875, -20.759765625, -16.0703125, -11.380859375, -6.69140625, -2.001953125, 2.6875, 7.376953125, 12.06640625, 16.755859375, 21.4453125, 26.134765625, 30.82421875, 35.513671875, 40.203125, 44.892578125, 49.58203125, 54.271484375, 58.9609375, 63.650390625, 68.33984375, 73.029296875, 77.71875, 82.408203125, 87.09765625, 91.787109375, 96.4765625, 101.166015625, 105.85546875, 110.544921875, 115.234375, 119.923828125, 124.61328125, 129.302734375, 133.9921875, 138.681640625, 143.37109375, 148.060546875, 152.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 10.0, 7.0, 7.0, 8.0, 14.0, 18.0, 23.0, 35.0, 48.0, 50.0, 63.0, 87.0, 159.0, 121.0, 61.0, 61.0, 47.0, 34.0, 30.0, 16.0, 17.0, 19.0, 14.0, 7.0, 10.0, 9.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2396.674072265625, -2304.192626953125, -2211.711181640625, -2119.229736328125, -2026.748291015625, -1934.266845703125, -1841.7852783203125, -1749.3038330078125, -1656.8223876953125, -1564.3409423828125, -1471.8594970703125, -1379.3779296875, -1286.896484375, -1194.4150390625, -1101.93359375, -1009.4521484375, -916.970703125, -824.4892578125, -732.0078125, -639.5263061523438, -547.0448608398438, -454.56341552734375, -362.0819091796875, -269.6004638671875, -177.1190185546875, -84.63755798339844, 7.843902587890625, 100.32537841796875, 192.80682373046875, 285.28826904296875, 377.769775390625, 470.251220703125, 562.732666015625, 655.214111328125, 747.695556640625, 840.1770629882812, 932.6585083007812, 1025.139892578125, 1117.6214599609375, 1210.1029052734375, 1302.5843505859375, 1395.0657958984375, 1487.5472412109375, 1580.02880859375, 1672.51025390625, 1764.99169921875, 1857.47314453125, 1949.95458984375, 2042.43603515625, 2134.91748046875, 2227.39892578125, 2319.88037109375, 2412.36181640625, 2504.84326171875, 2597.32470703125, 2689.80615234375, 2782.28759765625, 2874.76904296875, 2967.25048828125, 3059.73193359375, 3152.21337890625, 3244.69482421875, 3337.17626953125, 3429.65771484375, 3522.139404296875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 6.0, 10.0, 10.0, 14.0, 19.0, 19.0, 17.0, 22.0, 18.0, 28.0, 23.0, 32.0, 47.0, 49.0, 81.0, 105.0, 76.0, 74.0, 44.0, 25.0, 27.0, 27.0, 23.0, 21.0, 25.0, 21.0, 16.0, 16.0, 16.0, 8.0, 9.0, 10.0, 11.0, 1.0, 2.0, 7.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3043.0244140625, -2941.0390625, -2839.053955078125, -2737.068603515625, -2635.08349609375, -2533.09814453125, -2431.11279296875, -2329.127685546875, -2227.142333984375, -2125.156982421875, -2023.171875, -1921.1865234375, -1819.2012939453125, -1717.216064453125, -1615.2308349609375, -1513.24560546875, -1411.2603759765625, -1309.275146484375, -1207.2899169921875, -1105.3046875, -1003.3193359375, -901.3341064453125, -799.348876953125, -697.3635864257812, -595.3783569335938, -493.3930969238281, -391.4078369140625, -289.422607421875, -187.43734741210938, -85.45208740234375, 16.53314208984375, 118.5184326171875, 220.503662109375, 322.4889221191406, 424.47418212890625, 526.4594116210938, 628.4447021484375, 730.429931640625, 832.4151611328125, 934.4004516601562, 1036.3857421875, 1138.3709716796875, 1240.356201171875, 1342.341552734375, 1444.3267822265625, 1546.31201171875, 1648.2972412109375, 1750.282470703125, 1852.2677001953125, 1954.2529296875, 2056.23828125, 2158.223388671875, 2260.208740234375, 2362.19384765625, 2464.17919921875, 2566.16455078125, 2668.149658203125, 2770.135009765625, 2872.1201171875, 2974.10546875, 3076.090576171875, 3178.075927734375, 3280.06103515625, 3382.04638671875, 3484.03173828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 4.0, 5.0, 16.0, 15.0, 27.0, 43.0, 83.0, 126.0, 208.0, 381.0, 660.0, 1029.0, 1616.0, 2868.0, 5176.0, 10051.0, 23423.0, 75797.0, 653358.0, 3228009.0, 139557.0, 32000.0, 10747.0, 4408.0, 2112.0, 1106.0, 588.0, 339.0, 187.0, 106.0, 75.0, 52.0, 36.0, 24.0, 17.0, 16.0, 3.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.328125, -28.416259765625, -27.50439453125, -26.592529296875, -25.6806640625, -24.768798828125, -23.85693359375, -22.945068359375, -22.033203125, -21.121337890625, -20.20947265625, -19.297607421875, -18.3857421875, -17.473876953125, -16.56201171875, -15.650146484375, -14.73828125, -13.826416015625, -12.91455078125, -12.002685546875, -11.0908203125, -10.178955078125, -9.26708984375, -8.355224609375, -7.443359375, -6.531494140625, -5.61962890625, -4.707763671875, -3.7958984375, -2.884033203125, -1.97216796875, -1.060302734375, -0.1484375, 0.763427734375, 1.67529296875, 2.587158203125, 3.4990234375, 4.410888671875, 5.32275390625, 6.234619140625, 7.146484375, 8.058349609375, 8.97021484375, 9.882080078125, 10.7939453125, 11.705810546875, 12.61767578125, 13.529541015625, 14.44140625, 15.353271484375, 16.26513671875, 17.177001953125, 18.0888671875, 19.000732421875, 19.91259765625, 20.824462890625, 21.736328125, 22.648193359375, 23.56005859375, 24.471923828125, 25.3837890625, 26.295654296875, 27.20751953125, 28.119384765625, 29.03125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 6.0, 8.0, 4.0, 17.0, 26.0, 38.0, 54.0, 87.0, 96.0, 165.0, 142.0, 89.0, 83.0, 53.0, 33.0, 33.0, 16.0, 8.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.79296875, -3.65155029296875, -3.5101318359375, -3.36871337890625, -3.227294921875, -3.08587646484375, -2.9444580078125, -2.80303955078125, -2.66162109375, -2.52020263671875, -2.3787841796875, -2.23736572265625, -2.095947265625, -1.95452880859375, -1.8131103515625, -1.67169189453125, -1.5302734375, -1.38885498046875, -1.2474365234375, -1.10601806640625, -0.964599609375, -0.82318115234375, -0.6817626953125, -0.54034423828125, -0.39892578125, -0.25750732421875, -0.1160888671875, 0.02532958984375, 0.166748046875, 0.30816650390625, 0.4495849609375, 0.59100341796875, 0.732421875, 0.87384033203125, 1.0152587890625, 1.15667724609375, 1.298095703125, 1.43951416015625, 1.5809326171875, 1.72235107421875, 1.86376953125, 2.00518798828125, 2.1466064453125, 2.28802490234375, 2.429443359375, 2.57086181640625, 2.7122802734375, 2.85369873046875, 2.9951171875, 3.13653564453125, 3.2779541015625, 3.41937255859375, 3.560791015625, 3.70220947265625, 3.8436279296875, 3.98504638671875, 4.12646484375, 4.26788330078125, 4.4093017578125, 4.55072021484375, 4.692138671875, 4.83355712890625, 4.9749755859375, 5.11639404296875, 5.2578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 1.0, 5.0, 14.0, 12.0, 24.0, 21.0, 28.0, 51.0, 77.0, 90.0, 163.0, 209.0, 353.0, 582.0, 911.0, 1568.0, 2694.0, 4944.0, 9157.0, 17976.0, 38070.0, 86314.0, 228095.0, 856772.0, 2265271.0, 432912.0, 139687.0, 56128.0, 25477.0, 12288.0, 6340.0, 3415.0, 1812.0, 1095.0, 646.0, 373.0, 263.0, 153.0, 92.0, 65.0, 46.0, 30.0, 17.0, 15.0, 6.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.5234375, -15.0269775390625, -14.530517578125, -14.0340576171875, -13.53759765625, -13.0411376953125, -12.544677734375, -12.0482177734375, -11.5517578125, -11.0552978515625, -10.558837890625, -10.0623779296875, -9.56591796875, -9.0694580078125, -8.572998046875, -8.0765380859375, -7.580078125, -7.0836181640625, -6.587158203125, -6.0906982421875, -5.59423828125, -5.0977783203125, -4.601318359375, -4.1048583984375, -3.6083984375, -3.1119384765625, -2.615478515625, -2.1190185546875, -1.62255859375, -1.1260986328125, -0.629638671875, -0.1331787109375, 0.36328125, 0.8597412109375, 1.356201171875, 1.8526611328125, 2.34912109375, 2.8455810546875, 3.342041015625, 3.8385009765625, 4.3349609375, 4.8314208984375, 5.327880859375, 5.8243408203125, 6.32080078125, 6.8172607421875, 7.313720703125, 7.8101806640625, 8.306640625, 8.8031005859375, 9.299560546875, 9.7960205078125, 10.29248046875, 10.7889404296875, 11.285400390625, 11.7818603515625, 12.2783203125, 12.7747802734375, 13.271240234375, 13.7677001953125, 14.26416015625, 14.7606201171875, 15.257080078125, 15.7535400390625, 16.25]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 8.0, 6.0, 12.0, 16.0, 18.0, 25.0, 32.0, 42.0, 45.0, 62.0, 81.0, 99.0, 127.0, 152.0, 219.0, 298.0, 518.0, 844.0, 430.0, 254.0, 199.0, 141.0, 105.0, 70.0, 58.0, 51.0, 44.0, 26.0, 19.0, 13.0, 18.0, 5.0, 10.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.73828125, -7.5306396484375, -7.322998046875, -7.1153564453125, -6.90771484375, -6.7000732421875, -6.492431640625, -6.2847900390625, -6.0771484375, -5.8695068359375, -5.661865234375, -5.4542236328125, -5.24658203125, -5.0389404296875, -4.831298828125, -4.6236572265625, -4.416015625, -4.2083740234375, -4.000732421875, -3.7930908203125, -3.58544921875, -3.3778076171875, -3.170166015625, -2.9625244140625, -2.7548828125, -2.5472412109375, -2.339599609375, -2.1319580078125, -1.92431640625, -1.7166748046875, -1.509033203125, -1.3013916015625, -1.09375, -0.8861083984375, -0.678466796875, -0.4708251953125, -0.26318359375, -0.0555419921875, 0.152099609375, 0.3597412109375, 0.5673828125, 0.7750244140625, 0.982666015625, 1.1903076171875, 1.39794921875, 1.6055908203125, 1.813232421875, 2.0208740234375, 2.228515625, 2.4361572265625, 2.643798828125, 2.8514404296875, 3.05908203125, 3.2667236328125, 3.474365234375, 3.6820068359375, 3.8896484375, 4.0972900390625, 4.304931640625, 4.5125732421875, 4.72021484375, 4.9278564453125, 5.135498046875, 5.3431396484375, 5.55078125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 5.0, 8.0, 12.0, 12.0, 13.0, 24.0, 28.0, 50.0, 67.0, 61.0, 93.0, 92.0, 99.0, 111.0, 81.0, 66.0, 45.0, 50.0, 22.0, 15.0, 10.0, 13.0, 4.0, 4.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.39988708496094, -46.92252731323242, -45.445167541503906, -43.96780776977539, -42.490447998046875, -41.01308822631836, -39.535728454589844, -38.05836868286133, -36.58100891113281, -35.1036491394043, -33.62628936767578, -32.148929595947266, -30.67156982421875, -29.194210052490234, -27.71685028076172, -26.239490509033203, -24.762128829956055, -23.28476905822754, -21.807409286499023, -20.330049514770508, -18.852689743041992, -17.375329971313477, -15.897969245910645, -14.420609474182129, -12.943249702453613, -11.465889930725098, -9.988530158996582, -8.51116943359375, -7.033810138702393, -5.556450366973877, -4.079090118408203, -2.6017303466796875, -1.1243705749511719, 0.3529893159866333, 1.8303492069244385, 3.307709217071533, 4.785068988800049, 6.2624287605285645, 7.739789009094238, 9.217148780822754, 10.69450855255127, 12.171868324279785, 13.6492280960083, 15.126588821411133, 16.60394859313965, 18.081308364868164, 19.55866813659668, 21.036027908325195, 22.51338768005371, 23.990747451782227, 25.468107223510742, 26.945466995239258, 28.422826766967773, 29.90018653869629, 31.377548217773438, 32.85490798950195, 34.33226776123047, 35.809627532958984, 37.2869873046875, 38.764347076416016, 40.24170684814453, 41.71906661987305, 43.19642639160156, 44.67378616333008, 46.151145935058594]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 7.0, 10.0, 15.0, 13.0, 18.0, 18.0, 15.0, 22.0, 23.0, 23.0, 34.0, 31.0, 37.0, 31.0, 39.0, 45.0, 41.0, 33.0, 45.0, 35.0, 38.0, 39.0, 43.0, 42.0, 35.0, 27.0, 32.0, 26.0, 22.0, 23.0, 15.0, 16.0, 16.0, 15.0, 15.0, 10.0, 9.0, 2.0, 4.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.855472564697266, -27.86359405517578, -26.871715545654297, -25.879837036132812, -24.887958526611328, -23.896080017089844, -22.90420150756836, -21.912322998046875, -20.92044448852539, -19.928565979003906, -18.936687469482422, -17.944808959960938, -16.952930450439453, -15.961051940917969, -14.969173431396484, -13.977294921875, -12.985416412353516, -11.993537902832031, -11.001659393310547, -10.009780883789062, -9.017902374267578, -8.026023864746094, -7.034145355224609, -6.042266845703125, -5.050388336181641, -4.058509826660156, -3.066631317138672, -2.0747528076171875, -1.0828742980957031, -0.09099578857421875, 0.9008827209472656, 1.89276123046875, 2.8846397399902344, 3.8765182495117188, 4.868396759033203, 5.8602752685546875, 6.852153778076172, 7.844032287597656, 8.83591079711914, 9.827789306640625, 10.81966781616211, 11.811546325683594, 12.803424835205078, 13.795303344726562, 14.787181854248047, 15.779060363769531, 16.770938873291016, 17.7628173828125, 18.754695892333984, 19.74657440185547, 20.738452911376953, 21.730331420898438, 22.722209930419922, 23.714088439941406, 24.70596694946289, 25.697845458984375, 26.68972396850586, 27.681602478027344, 28.673480987548828, 29.665359497070312, 30.657238006591797, 31.64911651611328, 32.640995025634766, 33.63287353515625, 34.624752044677734]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 23.0, 26.0, 38.0, 72.0, 70.0, 120.0, 164.0, 244.0, 365.0, 534.0, 786.0, 1239.0, 2012.0, 3753.0, 7744.0, 19971.0, 69384.0, 464456.0, 380759.0, 61780.0, 18404.0, 7274.0, 3768.0, 2028.0, 1201.0, 794.0, 520.0, 308.0, 228.0, 141.0, 95.0, 72.0, 36.0, 23.0, 26.0, 7.0, 8.0, 14.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.6171875, -14.1124267578125, -13.607666015625, -13.1029052734375, -12.59814453125, -12.0933837890625, -11.588623046875, -11.0838623046875, -10.5791015625, -10.0743408203125, -9.569580078125, -9.0648193359375, -8.56005859375, -8.0552978515625, -7.550537109375, -7.0457763671875, -6.541015625, -6.0362548828125, -5.531494140625, -5.0267333984375, -4.52197265625, -4.0172119140625, -3.512451171875, -3.0076904296875, -2.5029296875, -1.9981689453125, -1.493408203125, -0.9886474609375, -0.48388671875, 0.0208740234375, 0.525634765625, 1.0303955078125, 1.53515625, 2.0399169921875, 2.544677734375, 3.0494384765625, 3.55419921875, 4.0589599609375, 4.563720703125, 5.0684814453125, 5.5732421875, 6.0780029296875, 6.582763671875, 7.0875244140625, 7.59228515625, 8.0970458984375, 8.601806640625, 9.1065673828125, 9.611328125, 10.1160888671875, 10.620849609375, 11.1256103515625, 11.63037109375, 12.1351318359375, 12.639892578125, 13.1446533203125, 13.6494140625, 14.1541748046875, 14.658935546875, 15.1636962890625, 15.66845703125, 16.1732177734375, 16.677978515625, 17.1827392578125, 17.6875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 1.0, 3.0, 7.0, 5.0, 12.0, 23.0, 43.0, 72.0, 93.0, 117.0, 128.0, 131.0, 124.0, 66.0, 55.0, 37.0, 27.0, 17.0, 11.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23828125, -4.073486328125, -3.90869140625, -3.743896484375, -3.5791015625, -3.414306640625, -3.24951171875, -3.084716796875, -2.919921875, -2.755126953125, -2.59033203125, -2.425537109375, -2.2607421875, -2.095947265625, -1.93115234375, -1.766357421875, -1.6015625, -1.436767578125, -1.27197265625, -1.107177734375, -0.9423828125, -0.777587890625, -0.61279296875, -0.447998046875, -0.283203125, -0.118408203125, 0.04638671875, 0.211181640625, 0.3759765625, 0.540771484375, 0.70556640625, 0.870361328125, 1.03515625, 1.199951171875, 1.36474609375, 1.529541015625, 1.6943359375, 1.859130859375, 2.02392578125, 2.188720703125, 2.353515625, 2.518310546875, 2.68310546875, 2.847900390625, 3.0126953125, 3.177490234375, 3.34228515625, 3.507080078125, 3.671875, 3.836669921875, 4.00146484375, 4.166259765625, 4.3310546875, 4.495849609375, 4.66064453125, 4.825439453125, 4.990234375, 5.155029296875, 5.31982421875, 5.484619140625, 5.6494140625, 5.814208984375, 5.97900390625, 6.143798828125, 6.30859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 6.0, 7.0, 8.0, 24.0, 38.0, 69.0, 73.0, 131.0, 176.0, 299.0, 517.0, 799.0, 1344.0, 2374.0, 4005.0, 6966.0, 13019.0, 25641.0, 54330.0, 136180.0, 445886.0, 210882.0, 74490.0, 33743.0, 16673.0, 8854.0, 4968.0, 2784.0, 1644.0, 968.0, 606.0, 372.0, 225.0, 146.0, 98.0, 62.0, 47.0, 24.0, 21.0, 11.0, 8.0, 6.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1796875, -12.7884521484375, -12.397216796875, -12.0059814453125, -11.61474609375, -11.2235107421875, -10.832275390625, -10.4410400390625, -10.0498046875, -9.6585693359375, -9.267333984375, -8.8760986328125, -8.48486328125, -8.0936279296875, -7.702392578125, -7.3111572265625, -6.919921875, -6.5286865234375, -6.137451171875, -5.7462158203125, -5.35498046875, -4.9637451171875, -4.572509765625, -4.1812744140625, -3.7900390625, -3.3988037109375, -3.007568359375, -2.6163330078125, -2.22509765625, -1.8338623046875, -1.442626953125, -1.0513916015625, -0.66015625, -0.2689208984375, 0.122314453125, 0.5135498046875, 0.90478515625, 1.2960205078125, 1.687255859375, 2.0784912109375, 2.4697265625, 2.8609619140625, 3.252197265625, 3.6434326171875, 4.03466796875, 4.4259033203125, 4.817138671875, 5.2083740234375, 5.599609375, 5.9908447265625, 6.382080078125, 6.7733154296875, 7.16455078125, 7.5557861328125, 7.947021484375, 8.3382568359375, 8.7294921875, 9.1207275390625, 9.511962890625, 9.9031982421875, 10.29443359375, 10.6856689453125, 11.076904296875, 11.4681396484375, 11.859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 4.0, 8.0, 13.0, 12.0, 15.0, 14.0, 16.0, 19.0, 24.0, 19.0, 27.0, 32.0, 26.0, 46.0, 27.0, 44.0, 32.0, 42.0, 40.0, 46.0, 42.0, 48.0, 39.0, 34.0, 36.0, 36.0, 34.0, 41.0, 36.0, 20.0, 25.0, 17.0, 14.0, 13.0, 4.0, 10.0, 11.0, 9.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3984375, -12.9661865234375, -12.533935546875, -12.1016845703125, -11.66943359375, -11.2371826171875, -10.804931640625, -10.3726806640625, -9.9404296875, -9.5081787109375, -9.075927734375, -8.6436767578125, -8.21142578125, -7.7791748046875, -7.346923828125, -6.9146728515625, -6.482421875, -6.0501708984375, -5.617919921875, -5.1856689453125, -4.75341796875, -4.3211669921875, -3.888916015625, -3.4566650390625, -3.0244140625, -2.5921630859375, -2.159912109375, -1.7276611328125, -1.29541015625, -0.8631591796875, -0.430908203125, 0.0013427734375, 0.43359375, 0.8658447265625, 1.298095703125, 1.7303466796875, 2.16259765625, 2.5948486328125, 3.027099609375, 3.4593505859375, 3.8916015625, 4.3238525390625, 4.756103515625, 5.1883544921875, 5.62060546875, 6.0528564453125, 6.485107421875, 6.9173583984375, 7.349609375, 7.7818603515625, 8.214111328125, 8.6463623046875, 9.07861328125, 9.5108642578125, 9.943115234375, 10.3753662109375, 10.8076171875, 11.2398681640625, 11.672119140625, 12.1043701171875, 12.53662109375, 12.9688720703125, 13.401123046875, 13.8333740234375, 14.265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 11.0, 6.0, 18.0, 12.0, 14.0, 34.0, 35.0, 49.0, 81.0, 98.0, 166.0, 302.0, 476.0, 910.0, 1868.0, 4352.0, 10999.0, 34189.0, 160408.0, 599087.0, 177771.0, 37176.0, 11586.0, 4599.0, 1991.0, 975.0, 516.0, 277.0, 182.0, 97.0, 49.0, 54.0, 27.0, 33.0, 20.0, 15.0, 19.0, 10.0, 10.0, 3.0, 6.0, 1.0, 3.0, 8.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-11.28125, -10.9344482421875, -10.587646484375, -10.2408447265625, -9.89404296875, -9.5472412109375, -9.200439453125, -8.8536376953125, -8.5068359375, -8.1600341796875, -7.813232421875, -7.4664306640625, -7.11962890625, -6.7728271484375, -6.426025390625, -6.0792236328125, -5.732421875, -5.3856201171875, -5.038818359375, -4.6920166015625, -4.34521484375, -3.9984130859375, -3.651611328125, -3.3048095703125, -2.9580078125, -2.6112060546875, -2.264404296875, -1.9176025390625, -1.57080078125, -1.2239990234375, -0.877197265625, -0.5303955078125, -0.18359375, 0.1632080078125, 0.510009765625, 0.8568115234375, 1.20361328125, 1.5504150390625, 1.897216796875, 2.2440185546875, 2.5908203125, 2.9376220703125, 3.284423828125, 3.6312255859375, 3.97802734375, 4.3248291015625, 4.671630859375, 5.0184326171875, 5.365234375, 5.7120361328125, 6.058837890625, 6.4056396484375, 6.75244140625, 7.0992431640625, 7.446044921875, 7.7928466796875, 8.1396484375, 8.4864501953125, 8.833251953125, 9.1800537109375, 9.52685546875, 9.8736572265625, 10.220458984375, 10.5672607421875, 10.9140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 3.0, 5.0, 6.0, 11.0, 14.0, 22.0, 14.0, 25.0, 34.0, 37.0, 60.0, 102.0, 92.0, 95.0, 84.0, 81.0, 81.0, 58.0, 51.0, 25.0, 25.0, 14.0, 13.0, 14.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008211135864257812, -0.0007904917001724243, -0.0007598698139190674, -0.0007292479276657104, -0.0006986260414123535, -0.0006680041551589966, -0.0006373822689056396, -0.0006067603826522827, -0.0005761384963989258, -0.0005455166101455688, -0.0005148947238922119, -0.000484272837638855, -0.00045365095138549805, -0.0004230290651321411, -0.0003924071788787842, -0.00036178529262542725, -0.0003311634063720703, -0.0003005415201187134, -0.00026991963386535645, -0.0002392977476119995, -0.00020867586135864258, -0.00017805397510528564, -0.0001474320888519287, -0.00011681020259857178, -8.618831634521484e-05, -5.556643009185791e-05, -2.4944543838500977e-05, 5.677342414855957e-06, 3.629922866821289e-05, 6.692111492156982e-05, 9.754300117492676e-05, 0.0001281648874282837, 0.00015878677368164062, 0.00018940865993499756, 0.0002200305461883545, 0.0002506524324417114, 0.00028127431869506836, 0.0003118962049484253, 0.0003425180912017822, 0.00037313997745513916, 0.0004037618637084961, 0.00043438374996185303, 0.00046500563621520996, 0.0004956275224685669, 0.0005262494087219238, 0.0005568712949752808, 0.0005874931812286377, 0.0006181150674819946, 0.0006487369537353516, 0.0006793588399887085, 0.0007099807262420654, 0.0007406026124954224, 0.0007712244987487793, 0.0008018463850021362, 0.0008324682712554932, 0.0008630901575088501, 0.000893712043762207, 0.000924333930015564, 0.0009549558162689209, 0.0009855777025222778, 0.0010161995887756348, 0.0010468214750289917, 0.0010774433612823486, 0.0011080652475357056, 0.0011386871337890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 11.0, 5.0, 9.0, 12.0, 29.0, 40.0, 52.0, 83.0, 114.0, 207.0, 317.0, 475.0, 715.0, 1187.0, 2171.0, 4111.0, 8467.0, 18944.0, 47906.0, 145887.0, 435294.0, 253623.0, 76643.0, 27942.0, 11700.0, 5567.0, 2862.0, 1634.0, 940.0, 548.0, 372.0, 223.0, 128.0, 92.0, 80.0, 48.0, 44.0, 28.0, 9.0, 13.0, 6.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.015625, -6.7713623046875, -6.527099609375, -6.2828369140625, -6.03857421875, -5.7943115234375, -5.550048828125, -5.3057861328125, -5.0615234375, -4.8172607421875, -4.572998046875, -4.3287353515625, -4.08447265625, -3.8402099609375, -3.595947265625, -3.3516845703125, -3.107421875, -2.8631591796875, -2.618896484375, -2.3746337890625, -2.13037109375, -1.8861083984375, -1.641845703125, -1.3975830078125, -1.1533203125, -0.9090576171875, -0.664794921875, -0.4205322265625, -0.17626953125, 0.0679931640625, 0.312255859375, 0.5565185546875, 0.80078125, 1.0450439453125, 1.289306640625, 1.5335693359375, 1.77783203125, 2.0220947265625, 2.266357421875, 2.5106201171875, 2.7548828125, 2.9991455078125, 3.243408203125, 3.4876708984375, 3.73193359375, 3.9761962890625, 4.220458984375, 4.4647216796875, 4.708984375, 4.9532470703125, 5.197509765625, 5.4417724609375, 5.68603515625, 5.9302978515625, 6.174560546875, 6.4188232421875, 6.6630859375, 6.9073486328125, 7.151611328125, 7.3958740234375, 7.64013671875, 7.8843994140625, 8.128662109375, 8.3729248046875, 8.6171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 4.0, 13.0, 12.0, 23.0, 15.0, 21.0, 28.0, 30.0, 38.0, 47.0, 45.0, 51.0, 54.0, 62.0, 66.0, 72.0, 59.0, 69.0, 39.0, 49.0, 33.0, 30.0, 21.0, 20.0, 14.0, 14.0, 15.0, 8.0, 8.0, 7.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.43865966796875, -5.2640380859375, -5.08941650390625, -4.914794921875, -4.74017333984375, -4.5655517578125, -4.39093017578125, -4.21630859375, -4.04168701171875, -3.8670654296875, -3.69244384765625, -3.517822265625, -3.34320068359375, -3.1685791015625, -2.99395751953125, -2.8193359375, -2.64471435546875, -2.4700927734375, -2.29547119140625, -2.120849609375, -1.94622802734375, -1.7716064453125, -1.59698486328125, -1.42236328125, -1.24774169921875, -1.0731201171875, -0.89849853515625, -0.723876953125, -0.54925537109375, -0.3746337890625, -0.20001220703125, -0.025390625, 0.14923095703125, 0.3238525390625, 0.49847412109375, 0.673095703125, 0.84771728515625, 1.0223388671875, 1.19696044921875, 1.37158203125, 1.54620361328125, 1.7208251953125, 1.89544677734375, 2.070068359375, 2.24468994140625, 2.4193115234375, 2.59393310546875, 2.7685546875, 2.94317626953125, 3.1177978515625, 3.29241943359375, 3.467041015625, 3.64166259765625, 3.8162841796875, 3.99090576171875, 4.16552734375, 4.34014892578125, 4.5147705078125, 4.68939208984375, 4.864013671875, 5.03863525390625, 5.2132568359375, 5.38787841796875, 5.5625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 14.0, 33.0, 45.0, 99.0, 250.0, 296.0, 111.0, 68.0, 34.0, 16.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.2933654785156, -251.33868408203125, -244.3839874267578, -237.42930603027344, -230.47462463378906, -223.51992797851562, -216.56524658203125, -209.61056518554688, -202.6558837890625, -195.70120239257812, -188.7465057373047, -181.7918243408203, -174.83714294433594, -167.8824462890625, -160.92776489257812, -153.97308349609375, -147.0183868408203, -140.06370544433594, -133.1090087890625, -126.15432739257812, -119.19964599609375, -112.24495697021484, -105.29026794433594, -98.33558654785156, -91.38089752197266, -84.42620849609375, -77.47152709960938, -70.51683807373047, -63.56215286254883, -56.60746765136719, -49.65277862548828, -42.69809341430664, -35.743408203125, -28.78872299194336, -21.834035873413086, -14.879348754882812, -7.924663543701172, -0.9699783325195312, 5.984710693359375, 12.939395904541016, 19.894081115722656, 26.848766326904297, 33.80345153808594, 40.758140563964844, 47.712825775146484, 54.667510986328125, 61.62220001220703, 68.57688903808594, 75.53157043457031, 82.48625946044922, 89.4409408569336, 96.3956298828125, 103.35031127929688, 110.30500030517578, 117.25968933105469, 124.21437072753906, 131.1690673828125, 138.12374877929688, 145.0784454345703, 152.0331268310547, 158.98780822753906, 165.9425048828125, 172.89718627929688, 179.85186767578125, 186.80654907226562]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 11.0, 13.0, 7.0, 16.0, 23.0, 47.0, 88.0, 141.0, 179.0, 149.0, 118.0, 74.0, 36.0, 26.0, 12.0, 10.0, 7.0, 7.0, 1.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-230.62716674804688, -221.70372009277344, -212.78025817871094, -203.8568115234375, -194.933349609375, -186.00990295410156, -177.08645629882812, -168.16299438476562, -159.2395477294922, -150.31610107421875, -141.39263916015625, -132.4691925048828, -123.54573822021484, -114.62228393554688, -105.69883728027344, -96.77538299560547, -87.8519287109375, -78.92847442626953, -70.00502014160156, -61.081573486328125, -52.158119201660156, -43.23466491699219, -34.311214447021484, -25.38776397705078, -16.464309692382812, -7.540857315063477, 1.3825950622558594, 10.306047439575195, 19.22949981689453, 28.1529541015625, 37.0764045715332, 45.999855041503906, 54.92333984375, 63.84679412841797, 72.77024841308594, 81.69369506835938, 90.61714935302734, 99.54060363769531, 108.46405029296875, 117.38750457763672, 126.31095886230469, 135.23440551757812, 144.15786743164062, 153.08131408691406, 162.0047607421875, 170.92822265625, 179.85166931152344, 188.77511596679688, 197.69857788085938, 206.6220245361328, 215.5454864501953, 224.46893310546875, 233.39239501953125, 242.3158416748047, 251.23928833007812, 260.1627502441406, 269.086181640625, 278.0096435546875, 286.9330749511719, 295.8565368652344, 304.7799987792969, 313.70343017578125, 322.62689208984375, 331.55035400390625, 340.47381591796875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 6.0, 11.0, 18.0, 19.0, 49.0, 86.0, 174.0, 322.0, 701.0, 1379.0, 3540.0, 10439.0, 52685.0, 3781214.0, 307449.0, 26344.0, 6054.0, 2035.0, 799.0, 420.0, 209.0, 135.0, 68.0, 39.0, 26.0, 17.0, 9.0, 9.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.375, -62.140625, -59.90625, -57.671875, -55.4375, -53.203125, -50.96875, -48.734375, -46.5, -44.265625, -42.03125, -39.796875, -37.5625, -35.328125, -33.09375, -30.859375, -28.625, -26.390625, -24.15625, -21.921875, -19.6875, -17.453125, -15.21875, -12.984375, -10.75, -8.515625, -6.28125, -4.046875, -1.8125, 0.421875, 2.65625, 4.890625, 7.125, 9.359375, 11.59375, 13.828125, 16.0625, 18.296875, 20.53125, 22.765625, 25.0, 27.234375, 29.46875, 31.703125, 33.9375, 36.171875, 38.40625, 40.640625, 42.875, 45.109375, 47.34375, 49.578125, 51.8125, 54.046875, 56.28125, 58.515625, 60.75, 62.984375, 65.21875, 67.453125, 69.6875, 71.921875, 74.15625, 76.390625, 78.625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 12.0, 9.0, 7.0, 11.0, 17.0, 26.0, 37.0, 59.0, 65.0, 87.0, 94.0, 105.0, 120.0, 85.0, 66.0, 44.0, 44.0, 29.0, 20.0, 21.0, 8.0, 9.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0390625, -2.90386962890625, -2.7686767578125, -2.63348388671875, -2.498291015625, -2.36309814453125, -2.2279052734375, -2.09271240234375, -1.95751953125, -1.82232666015625, -1.6871337890625, -1.55194091796875, -1.416748046875, -1.28155517578125, -1.1463623046875, -1.01116943359375, -0.8759765625, -0.74078369140625, -0.6055908203125, -0.47039794921875, -0.335205078125, -0.20001220703125, -0.0648193359375, 0.07037353515625, 0.20556640625, 0.34075927734375, 0.4759521484375, 0.61114501953125, 0.746337890625, 0.88153076171875, 1.0167236328125, 1.15191650390625, 1.287109375, 1.42230224609375, 1.5574951171875, 1.69268798828125, 1.827880859375, 1.96307373046875, 2.0982666015625, 2.23345947265625, 2.36865234375, 2.50384521484375, 2.6390380859375, 2.77423095703125, 2.909423828125, 3.04461669921875, 3.1798095703125, 3.31500244140625, 3.4501953125, 3.58538818359375, 3.7205810546875, 3.85577392578125, 3.990966796875, 4.12615966796875, 4.2613525390625, 4.39654541015625, 4.53173828125, 4.66693115234375, 4.8021240234375, 4.93731689453125, 5.072509765625, 5.20770263671875, 5.3428955078125, 5.47808837890625, 5.61328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 16.0, 16.0, 25.0, 32.0, 50.0, 71.0, 93.0, 154.0, 246.0, 367.0, 639.0, 1029.0, 1862.0, 3334.0, 6262.0, 12954.0, 29057.0, 78145.0, 317399.0, 3295717.0, 315678.0, 76740.0, 28324.0, 12508.0, 6061.0, 3207.0, 1726.0, 942.0, 548.0, 376.0, 220.0, 134.0, 93.0, 80.0, 52.0, 33.0, 25.0, 18.0, 9.0, 11.0, 8.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-32.0625, -31.075927734375, -30.08935546875, -29.102783203125, -28.1162109375, -27.129638671875, -26.14306640625, -25.156494140625, -24.169921875, -23.183349609375, -22.19677734375, -21.210205078125, -20.2236328125, -19.237060546875, -18.25048828125, -17.263916015625, -16.27734375, -15.290771484375, -14.30419921875, -13.317626953125, -12.3310546875, -11.344482421875, -10.35791015625, -9.371337890625, -8.384765625, -7.398193359375, -6.41162109375, -5.425048828125, -4.4384765625, -3.451904296875, -2.46533203125, -1.478759765625, -0.4921875, 0.494384765625, 1.48095703125, 2.467529296875, 3.4541015625, 4.440673828125, 5.42724609375, 6.413818359375, 7.400390625, 8.386962890625, 9.37353515625, 10.360107421875, 11.3466796875, 12.333251953125, 13.31982421875, 14.306396484375, 15.29296875, 16.279541015625, 17.26611328125, 18.252685546875, 19.2392578125, 20.225830078125, 21.21240234375, 22.198974609375, 23.185546875, 24.172119140625, 25.15869140625, 26.145263671875, 27.1318359375, 28.118408203125, 29.10498046875, 30.091552734375, 31.078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 5.0, 12.0, 16.0, 9.0, 18.0, 20.0, 23.0, 34.0, 50.0, 55.0, 83.0, 147.0, 254.0, 460.0, 2035.0, 326.0, 162.0, 101.0, 59.0, 65.0, 42.0, 18.0, 19.0, 9.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.78717041015625, -4.5977783203125, -4.40838623046875, -4.218994140625, -4.02960205078125, -3.8402099609375, -3.65081787109375, -3.46142578125, -3.27203369140625, -3.0826416015625, -2.89324951171875, -2.703857421875, -2.51446533203125, -2.3250732421875, -2.13568115234375, -1.9462890625, -1.75689697265625, -1.5675048828125, -1.37811279296875, -1.188720703125, -0.99932861328125, -0.8099365234375, -0.62054443359375, -0.43115234375, -0.24176025390625, -0.0523681640625, 0.13702392578125, 0.326416015625, 0.51580810546875, 0.7052001953125, 0.89459228515625, 1.083984375, 1.27337646484375, 1.4627685546875, 1.65216064453125, 1.841552734375, 2.03094482421875, 2.2203369140625, 2.40972900390625, 2.59912109375, 2.78851318359375, 2.9779052734375, 3.16729736328125, 3.356689453125, 3.54608154296875, 3.7354736328125, 3.92486572265625, 4.1142578125, 4.30364990234375, 4.4930419921875, 4.68243408203125, 4.871826171875, 5.06121826171875, 5.2506103515625, 5.44000244140625, 5.62939453125, 5.81878662109375, 6.0081787109375, 6.19757080078125, 6.386962890625, 6.57635498046875, 6.7657470703125, 6.95513916015625, 7.14453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 11.0, 3.0, 8.0, 17.0, 10.0, 28.0, 63.0, 63.0, 130.0, 172.0, 161.0, 134.0, 64.0, 64.0, 25.0, 17.0, 11.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.96562194824219, -61.54591751098633, -60.1262092590332, -58.706504821777344, -57.28679656982422, -55.86709213256836, -54.4473876953125, -53.027679443359375, -51.607975006103516, -50.188270568847656, -48.76856231689453, -47.34885787963867, -45.92915344238281, -44.50944519042969, -43.08974075317383, -41.67003631591797, -40.250328063964844, -38.830623626708984, -37.41091537475586, -35.9912109375, -34.571502685546875, -33.151798248291016, -31.732093811035156, -30.312387466430664, -28.892681121826172, -27.47297477722168, -26.053268432617188, -24.633563995361328, -23.213857650756836, -21.794151306152344, -20.374446868896484, -18.954740524291992, -17.5350341796875, -16.115327835083008, -14.695622444152832, -13.275917053222656, -11.856210708618164, -10.436504364013672, -9.016798973083496, -7.59709358215332, -6.177387237548828, -4.757681369781494, -3.33797550201416, -1.9182696342468262, -0.4985637664794922, 0.9211421012878418, 2.340847969055176, 3.7605533599853516, 5.180259704589844, 6.599965572357178, 8.019671440124512, 9.439376831054688, 10.85908317565918, 12.278789520263672, 13.698494911193848, 15.118200302124023, 16.537906646728516, 17.957612991333008, 19.3773193359375, 20.79702377319336, 22.21673011779785, 23.636436462402344, 25.056140899658203, 26.475847244262695, 27.895553588867188]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 7.0, 8.0, 15.0, 14.0, 20.0, 25.0, 31.0, 37.0, 42.0, 57.0, 51.0, 57.0, 70.0, 60.0, 55.0, 63.0, 52.0, 40.0, 61.0, 44.0, 40.0, 34.0, 16.0, 19.0, 14.0, 10.0, 14.0, 6.0, 3.0, 7.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.37102699279785, -28.486143112182617, -27.601259231567383, -26.71637535095215, -25.83148956298828, -24.946605682373047, -24.061721801757812, -23.176837921142578, -22.291954040527344, -21.40707015991211, -20.522186279296875, -19.63730239868164, -18.752418518066406, -17.867534637451172, -16.982648849487305, -16.09776496887207, -15.212881088256836, -14.327997207641602, -13.443113327026367, -12.558228492736816, -11.673344612121582, -10.788460731506348, -9.903575897216797, -9.018692016601562, -8.133808135986328, -7.248924255371094, -6.364039897918701, -5.479155540466309, -4.594271659851074, -3.70938777923584, -2.8245034217834473, -1.9396190643310547, -1.0547332763671875, -0.16984915733337402, 0.7150349617004395, 1.599919080734253, 2.4848031997680664, 3.369687080383301, 4.254571437835693, 5.139455795288086, 6.02433967590332, 6.909223556518555, 7.794107913970947, 8.67899227142334, 9.563876152038574, 10.448760032653809, 11.33364486694336, 12.218528747558594, 13.103412628173828, 13.988296508789062, 14.873180389404297, 15.758065223693848, 16.642948150634766, 17.52783203125, 18.412717819213867, 19.2976016998291, 20.182485580444336, 21.06736946105957, 21.952253341674805, 22.83713722229004, 23.722023010253906, 24.60690689086914, 25.491790771484375, 26.37667465209961, 27.261558532714844]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 11.0, 6.0, 15.0, 31.0, 25.0, 60.0, 85.0, 136.0, 261.0, 494.0, 1091.0, 2517.0, 5991.0, 19358.0, 84212.0, 499382.0, 350720.0, 60493.0, 14823.0, 4825.0, 2057.0, 887.0, 463.0, 229.0, 113.0, 82.0, 56.0, 35.0, 30.0, 27.0, 10.0, 9.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.8232421875, -41.521484375, -40.2197265625, -38.91796875, -37.6162109375, -36.314453125, -35.0126953125, -33.7109375, -32.4091796875, -31.107421875, -29.8056640625, -28.50390625, -27.2021484375, -25.900390625, -24.5986328125, -23.296875, -21.9951171875, -20.693359375, -19.3916015625, -18.08984375, -16.7880859375, -15.486328125, -14.1845703125, -12.8828125, -11.5810546875, -10.279296875, -8.9775390625, -7.67578125, -6.3740234375, -5.072265625, -3.7705078125, -2.46875, -1.1669921875, 0.134765625, 1.4365234375, 2.73828125, 4.0400390625, 5.341796875, 6.6435546875, 7.9453125, 9.2470703125, 10.548828125, 11.8505859375, 13.15234375, 14.4541015625, 15.755859375, 17.0576171875, 18.359375, 19.6611328125, 20.962890625, 22.2646484375, 23.56640625, 24.8681640625, 26.169921875, 27.4716796875, 28.7734375, 30.0751953125, 31.376953125, 32.6787109375, 33.98046875, 35.2822265625, 36.583984375, 37.8857421875, 39.1875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 1.0, 2.0, 4.0, 10.0, 11.0, 19.0, 36.0, 45.0, 59.0, 79.0, 79.0, 75.0, 106.0, 102.0, 94.0, 61.0, 62.0, 51.0, 44.0, 10.0, 19.0, 7.0, 8.0, 4.0, 1.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.13232421875, -2.9873046875, -2.84228515625, -2.697265625, -2.55224609375, -2.4072265625, -2.26220703125, -2.1171875, -1.97216796875, -1.8271484375, -1.68212890625, -1.537109375, -1.39208984375, -1.2470703125, -1.10205078125, -0.95703125, -0.81201171875, -0.6669921875, -0.52197265625, -0.376953125, -0.23193359375, -0.0869140625, 0.05810546875, 0.203125, 0.34814453125, 0.4931640625, 0.63818359375, 0.783203125, 0.92822265625, 1.0732421875, 1.21826171875, 1.36328125, 1.50830078125, 1.6533203125, 1.79833984375, 1.943359375, 2.08837890625, 2.2333984375, 2.37841796875, 2.5234375, 2.66845703125, 2.8134765625, 2.95849609375, 3.103515625, 3.24853515625, 3.3935546875, 3.53857421875, 3.68359375, 3.82861328125, 3.9736328125, 4.11865234375, 4.263671875, 4.40869140625, 4.5537109375, 4.69873046875, 4.84375, 4.98876953125, 5.1337890625, 5.27880859375, 5.423828125, 5.56884765625, 5.7138671875, 5.85888671875, 6.00390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 14.0, 18.0, 32.0, 34.0, 53.0, 79.0, 131.0, 216.0, 355.0, 672.0, 1226.0, 2699.0, 6851.0, 18988.0, 68136.0, 329450.0, 475961.0, 101930.0, 26267.0, 8582.0, 3413.0, 1533.0, 735.0, 437.0, 244.0, 158.0, 108.0, 54.0, 56.0, 32.0, 29.0, 14.0, 11.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.783935546875, -21.97412109375, -21.164306640625, -20.3544921875, -19.544677734375, -18.73486328125, -17.925048828125, -17.115234375, -16.305419921875, -15.49560546875, -14.685791015625, -13.8759765625, -13.066162109375, -12.25634765625, -11.446533203125, -10.63671875, -9.826904296875, -9.01708984375, -8.207275390625, -7.3974609375, -6.587646484375, -5.77783203125, -4.968017578125, -4.158203125, -3.348388671875, -2.53857421875, -1.728759765625, -0.9189453125, -0.109130859375, 0.70068359375, 1.510498046875, 2.3203125, 3.130126953125, 3.93994140625, 4.749755859375, 5.5595703125, 6.369384765625, 7.17919921875, 7.989013671875, 8.798828125, 9.608642578125, 10.41845703125, 11.228271484375, 12.0380859375, 12.847900390625, 13.65771484375, 14.467529296875, 15.27734375, 16.087158203125, 16.89697265625, 17.706787109375, 18.5166015625, 19.326416015625, 20.13623046875, 20.946044921875, 21.755859375, 22.565673828125, 23.37548828125, 24.185302734375, 24.9951171875, 25.804931640625, 26.61474609375, 27.424560546875, 28.234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 11.0, 9.0, 6.0, 17.0, 29.0, 21.0, 27.0, 40.0, 43.0, 55.0, 58.0, 50.0, 72.0, 68.0, 54.0, 56.0, 59.0, 55.0, 48.0, 45.0, 40.0, 30.0, 27.0, 17.0, 14.0, 8.0, 11.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.3927001953125, -13.910400390625, -13.4281005859375, -12.94580078125, -12.4635009765625, -11.981201171875, -11.4989013671875, -11.0166015625, -10.5343017578125, -10.052001953125, -9.5697021484375, -9.08740234375, -8.6051025390625, -8.122802734375, -7.6405029296875, -7.158203125, -6.6759033203125, -6.193603515625, -5.7113037109375, -5.22900390625, -4.7467041015625, -4.264404296875, -3.7821044921875, -3.2998046875, -2.8175048828125, -2.335205078125, -1.8529052734375, -1.37060546875, -0.8883056640625, -0.406005859375, 0.0762939453125, 0.55859375, 1.0408935546875, 1.523193359375, 2.0054931640625, 2.48779296875, 2.9700927734375, 3.452392578125, 3.9346923828125, 4.4169921875, 4.8992919921875, 5.381591796875, 5.8638916015625, 6.34619140625, 6.8284912109375, 7.310791015625, 7.7930908203125, 8.275390625, 8.7576904296875, 9.239990234375, 9.7222900390625, 10.20458984375, 10.6868896484375, 11.169189453125, 11.6514892578125, 12.1337890625, 12.6160888671875, 13.098388671875, 13.5806884765625, 14.06298828125, 14.5452880859375, 15.027587890625, 15.5098876953125, 15.9921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 7.0, 6.0, 9.0, 14.0, 14.0, 16.0, 42.0, 60.0, 57.0, 106.0, 148.0, 228.0, 374.0, 628.0, 1068.0, 1938.0, 3723.0, 7858.0, 17829.0, 48304.0, 165256.0, 477794.0, 221199.0, 61177.0, 21799.0, 9187.0, 4436.0, 2205.0, 1213.0, 678.0, 364.0, 276.0, 183.0, 100.0, 68.0, 41.0, 45.0, 26.0, 17.0, 17.0, 12.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 5.0, 2.0, 1.0], "bins": [-27.078125, -26.317626953125, -25.55712890625, -24.796630859375, -24.0361328125, -23.275634765625, -22.51513671875, -21.754638671875, -20.994140625, -20.233642578125, -19.47314453125, -18.712646484375, -17.9521484375, -17.191650390625, -16.43115234375, -15.670654296875, -14.91015625, -14.149658203125, -13.38916015625, -12.628662109375, -11.8681640625, -11.107666015625, -10.34716796875, -9.586669921875, -8.826171875, -8.065673828125, -7.30517578125, -6.544677734375, -5.7841796875, -5.023681640625, -4.26318359375, -3.502685546875, -2.7421875, -1.981689453125, -1.22119140625, -0.460693359375, 0.2998046875, 1.060302734375, 1.82080078125, 2.581298828125, 3.341796875, 4.102294921875, 4.86279296875, 5.623291015625, 6.3837890625, 7.144287109375, 7.90478515625, 8.665283203125, 9.42578125, 10.186279296875, 10.94677734375, 11.707275390625, 12.4677734375, 13.228271484375, 13.98876953125, 14.749267578125, 15.509765625, 16.270263671875, 17.03076171875, 17.791259765625, 18.5517578125, 19.312255859375, 20.07275390625, 20.833251953125, 21.59375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 11.0, 10.0, 16.0, 31.0, 36.0, 62.0, 99.0, 157.0, 171.0, 125.0, 87.0, 64.0, 52.0, 23.0, 12.0, 13.0, 9.0, 1.0, 4.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003108978271484375, -0.0030025839805603027, -0.0028961896896362305, -0.002789795398712158, -0.002683401107788086, -0.0025770068168640137, -0.0024706125259399414, -0.002364218235015869, -0.002257823944091797, -0.0021514296531677246, -0.0020450353622436523, -0.00193864107131958, -0.0018322467803955078, -0.0017258524894714355, -0.0016194581985473633, -0.001513063907623291, -0.0014066696166992188, -0.0013002753257751465, -0.0011938810348510742, -0.001087486743927002, -0.0009810924530029297, -0.0008746981620788574, -0.0007683038711547852, -0.0006619095802307129, -0.0005555152893066406, -0.00044912099838256836, -0.0003427267074584961, -0.00023633241653442383, -0.00012993812561035156, -2.3543834686279297e-05, 8.285045623779297e-05, 0.00018924474716186523, 0.0002956390380859375, 0.00040203332901000977, 0.000508427619934082, 0.0006148219108581543, 0.0007212162017822266, 0.0008276104927062988, 0.0009340047836303711, 0.0010403990745544434, 0.0011467933654785156, 0.0012531876564025879, 0.0013595819473266602, 0.0014659762382507324, 0.0015723705291748047, 0.001678764820098877, 0.0017851591110229492, 0.0018915534019470215, 0.0019979476928710938, 0.002104341983795166, 0.0022107362747192383, 0.0023171305656433105, 0.002423524856567383, 0.002529919147491455, 0.0026363134384155273, 0.0027427077293395996, 0.002849102020263672, 0.002955496311187744, 0.0030618906021118164, 0.0031682848930358887, 0.003274679183959961, 0.003381073474884033, 0.0034874677658081055, 0.0035938620567321777, 0.00370025634765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 8.0, 18.0, 6.0, 23.0, 23.0, 45.0, 77.0, 101.0, 157.0, 259.0, 393.0, 697.0, 1210.0, 2430.0, 4856.0, 11128.0, 29000.0, 96094.0, 403275.0, 365593.0, 86136.0, 26745.0, 10379.0, 4664.0, 2282.0, 1201.0, 671.0, 406.0, 225.0, 138.0, 92.0, 67.0, 47.0, 27.0, 20.0, 15.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.09375, -23.28955078125, -22.4853515625, -21.68115234375, -20.876953125, -20.07275390625, -19.2685546875, -18.46435546875, -17.66015625, -16.85595703125, -16.0517578125, -15.24755859375, -14.443359375, -13.63916015625, -12.8349609375, -12.03076171875, -11.2265625, -10.42236328125, -9.6181640625, -8.81396484375, -8.009765625, -7.20556640625, -6.4013671875, -5.59716796875, -4.79296875, -3.98876953125, -3.1845703125, -2.38037109375, -1.576171875, -0.77197265625, 0.0322265625, 0.83642578125, 1.640625, 2.44482421875, 3.2490234375, 4.05322265625, 4.857421875, 5.66162109375, 6.4658203125, 7.27001953125, 8.07421875, 8.87841796875, 9.6826171875, 10.48681640625, 11.291015625, 12.09521484375, 12.8994140625, 13.70361328125, 14.5078125, 15.31201171875, 16.1162109375, 16.92041015625, 17.724609375, 18.52880859375, 19.3330078125, 20.13720703125, 20.94140625, 21.74560546875, 22.5498046875, 23.35400390625, 24.158203125, 24.96240234375, 25.7666015625, 26.57080078125, 27.375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 11.0, 19.0, 20.0, 25.0, 25.0, 29.0, 38.0, 46.0, 57.0, 53.0, 66.0, 79.0, 69.0, 72.0, 53.0, 53.0, 43.0, 40.0, 33.0, 34.0, 16.0, 13.0, 14.0, 7.0, 12.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.9234619140625, -10.518798828125, -10.1141357421875, -9.70947265625, -9.3048095703125, -8.900146484375, -8.4954833984375, -8.0908203125, -7.6861572265625, -7.281494140625, -6.8768310546875, -6.47216796875, -6.0675048828125, -5.662841796875, -5.2581787109375, -4.853515625, -4.4488525390625, -4.044189453125, -3.6395263671875, -3.23486328125, -2.8302001953125, -2.425537109375, -2.0208740234375, -1.6162109375, -1.2115478515625, -0.806884765625, -0.4022216796875, 0.00244140625, 0.4071044921875, 0.811767578125, 1.2164306640625, 1.62109375, 2.0257568359375, 2.430419921875, 2.8350830078125, 3.23974609375, 3.6444091796875, 4.049072265625, 4.4537353515625, 4.8583984375, 5.2630615234375, 5.667724609375, 6.0723876953125, 6.47705078125, 6.8817138671875, 7.286376953125, 7.6910400390625, 8.095703125, 8.5003662109375, 8.905029296875, 9.3096923828125, 9.71435546875, 10.1190185546875, 10.523681640625, 10.9283447265625, 11.3330078125, 11.7376708984375, 12.142333984375, 12.5469970703125, 12.95166015625, 13.3563232421875, 13.760986328125, 14.1656494140625, 14.5703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 35.0, 145.0, 359.0, 307.0, 78.0, 30.0, 24.0, 9.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.84410095214844, -149.30491638183594, -137.7657470703125, -126.2265625, -114.6873779296875, -103.148193359375, -91.60901641845703, -80.06983947753906, -68.53065490722656, -56.99147415161133, -45.452293395996094, -33.91311264038086, -22.373931884765625, -10.83475112915039, 0.7044296264648438, 12.243606567382812, 23.782791137695312, 35.32197189331055, 46.86115264892578, 58.400333404541016, 69.93951416015625, 81.47869873046875, 93.01787567138672, 104.55705261230469, 116.09623718261719, 127.63542175292969, 139.17459106445312, 150.71377563476562, 162.25296020507812, 173.79214477539062, 185.33132934570312, 196.87049865722656, 208.40966796875, 219.9488525390625, 231.488037109375, 243.02720642089844, 254.56639099121094, 266.1055603027344, 277.6447448730469, 289.1839294433594, 300.7231140136719, 312.2622985839844, 323.8014831542969, 335.3406677246094, 346.87982177734375, 358.41900634765625, 369.95819091796875, 381.49737548828125, 393.03656005859375, 404.57574462890625, 416.11492919921875, 427.65411376953125, 439.19329833984375, 450.7324523925781, 462.2716369628906, 473.8108215332031, 485.3500061035156, 496.8891906738281, 508.4283752441406, 519.967529296875, 531.5067138671875, 543.0458984375, 554.5850830078125, 566.124267578125, 577.6634521484375]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 2.0, 6.0, 1.0, 4.0, 6.0, 7.0, 11.0, 16.0, 15.0, 25.0, 23.0, 29.0, 36.0, 33.0, 47.0, 64.0, 65.0, 67.0, 50.0, 58.0, 70.0, 60.0, 57.0, 56.0, 39.0, 34.0, 31.0, 14.0, 10.0, 12.0, 10.0, 7.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.30193328857422, -82.23118591308594, -79.16043853759766, -76.08969116210938, -73.01893615722656, -69.94818878173828, -66.87744140625, -63.80669403076172, -60.73594284057617, -57.66519546508789, -54.594444274902344, -51.52369689941406, -48.45294952392578, -45.382198333740234, -42.31145095825195, -39.240699768066406, -36.169952392578125, -33.099205017089844, -30.028453826904297, -26.957706451416016, -23.8869571685791, -20.816207885742188, -17.745460510253906, -14.674711227416992, -11.603961944580078, -8.533212661743164, -5.462464332580566, -2.3917160034179688, 0.6790332794189453, 3.7497825622558594, 6.820529937744141, 9.891279220581055, 12.962020874023438, 16.03277015686035, 19.103519439697266, 22.174266815185547, 25.24501609802246, 28.315765380859375, 31.386512756347656, 34.45726013183594, 37.528011322021484, 40.598758697509766, 43.66950988769531, 46.740257263183594, 49.811004638671875, 52.88175582885742, 55.9525032043457, 59.02325439453125, 62.09400177001953, 65.16474914550781, 68.2354965209961, 71.30624389648438, 74.37699890136719, 77.44774627685547, 80.51849365234375, 83.58924102783203, 86.65998840332031, 89.7307357788086, 92.80148315429688, 95.87223815917969, 98.94298553466797, 102.01373291015625, 105.08448028564453, 108.15522766113281, 111.22598266601562]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 0.0, 2.0, 6.0, 4.0, 19.0, 19.0, 23.0, 40.0, 64.0, 102.0, 142.0, 240.0, 429.0, 738.0, 1305.0, 2672.0, 6185.0, 15721.0, 51130.0, 270382.0, 3471573.0, 290656.0, 54248.0, 16697.0, 6283.0, 2704.0, 1230.0, 617.0, 404.0, 228.0, 136.0, 84.0, 56.0, 38.0, 39.0, 16.0, 17.0, 6.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-67.875, -66.01611328125, -64.1572265625, -62.29833984375, -60.439453125, -58.58056640625, -56.7216796875, -54.86279296875, -53.00390625, -51.14501953125, -49.2861328125, -47.42724609375, -45.568359375, -43.70947265625, -41.8505859375, -39.99169921875, -38.1328125, -36.27392578125, -34.4150390625, -32.55615234375, -30.697265625, -28.83837890625, -26.9794921875, -25.12060546875, -23.26171875, -21.40283203125, -19.5439453125, -17.68505859375, -15.826171875, -13.96728515625, -12.1083984375, -10.24951171875, -8.390625, -6.53173828125, -4.6728515625, -2.81396484375, -0.955078125, 0.90380859375, 2.7626953125, 4.62158203125, 6.48046875, 8.33935546875, 10.1982421875, 12.05712890625, 13.916015625, 15.77490234375, 17.6337890625, 19.49267578125, 21.3515625, 23.21044921875, 25.0693359375, 26.92822265625, 28.787109375, 30.64599609375, 32.5048828125, 34.36376953125, 36.22265625, 38.08154296875, 39.9404296875, 41.79931640625, 43.658203125, 45.51708984375, 47.3759765625, 49.23486328125, 51.09375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 4.0, 5.0, 7.0, 13.0, 12.0, 25.0, 29.0, 40.0, 46.0, 56.0, 56.0, 80.0, 85.0, 91.0, 89.0, 78.0, 57.0, 49.0, 36.0, 42.0, 30.0, 24.0, 13.0, 6.0, 9.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -2.97515869140625, -2.8526611328125, -2.73016357421875, -2.607666015625, -2.48516845703125, -2.3626708984375, -2.24017333984375, -2.11767578125, -1.99517822265625, -1.8726806640625, -1.75018310546875, -1.627685546875, -1.50518798828125, -1.3826904296875, -1.26019287109375, -1.1376953125, -1.01519775390625, -0.8927001953125, -0.77020263671875, -0.647705078125, -0.52520751953125, -0.4027099609375, -0.28021240234375, -0.15771484375, -0.03521728515625, 0.0872802734375, 0.20977783203125, 0.332275390625, 0.45477294921875, 0.5772705078125, 0.69976806640625, 0.822265625, 0.94476318359375, 1.0672607421875, 1.18975830078125, 1.312255859375, 1.43475341796875, 1.5572509765625, 1.67974853515625, 1.80224609375, 1.92474365234375, 2.0472412109375, 2.16973876953125, 2.292236328125, 2.41473388671875, 2.5372314453125, 2.65972900390625, 2.7822265625, 2.90472412109375, 3.0272216796875, 3.14971923828125, 3.272216796875, 3.39471435546875, 3.5172119140625, 3.63970947265625, 3.76220703125, 3.88470458984375, 4.0072021484375, 4.12969970703125, 4.252197265625, 4.37469482421875, 4.4971923828125, 4.61968994140625, 4.7421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 9.0, 11.0, 7.0, 15.0, 12.0, 25.0, 26.0, 43.0, 56.0, 85.0, 163.0, 265.0, 570.0, 1373.0, 3953.0, 14455.0, 82214.0, 1189914.0, 2766463.0, 109169.0, 17875.0, 4634.0, 1573.0, 612.0, 281.0, 153.0, 100.0, 56.0, 39.0, 28.0, 32.0, 16.0, 9.0, 9.0, 4.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.125, -66.7470703125, -64.369140625, -61.9912109375, -59.61328125, -57.2353515625, -54.857421875, -52.4794921875, -50.1015625, -47.7236328125, -45.345703125, -42.9677734375, -40.58984375, -38.2119140625, -35.833984375, -33.4560546875, -31.078125, -28.7001953125, -26.322265625, -23.9443359375, -21.56640625, -19.1884765625, -16.810546875, -14.4326171875, -12.0546875, -9.6767578125, -7.298828125, -4.9208984375, -2.54296875, -0.1650390625, 2.212890625, 4.5908203125, 6.96875, 9.3466796875, 11.724609375, 14.1025390625, 16.48046875, 18.8583984375, 21.236328125, 23.6142578125, 25.9921875, 28.3701171875, 30.748046875, 33.1259765625, 35.50390625, 37.8818359375, 40.259765625, 42.6376953125, 45.015625, 47.3935546875, 49.771484375, 52.1494140625, 54.52734375, 56.9052734375, 59.283203125, 61.6611328125, 64.0390625, 66.4169921875, 68.794921875, 71.1728515625, 73.55078125, 75.9287109375, 78.306640625, 80.6845703125, 83.0625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 18.0, 13.0, 19.0, 18.0, 47.0, 51.0, 70.0, 88.0, 118.0, 173.0, 227.0, 354.0, 1095.0, 620.0, 298.0, 228.0, 168.0, 121.0, 72.0, 73.0, 39.0, 30.0, 17.0, 26.0, 13.0, 14.0, 8.0, 6.0, 7.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.6561279296875, -6.433349609375, -6.2105712890625, -5.98779296875, -5.7650146484375, -5.542236328125, -5.3194580078125, -5.0966796875, -4.8739013671875, -4.651123046875, -4.4283447265625, -4.20556640625, -3.9827880859375, -3.760009765625, -3.5372314453125, -3.314453125, -3.0916748046875, -2.868896484375, -2.6461181640625, -2.42333984375, -2.2005615234375, -1.977783203125, -1.7550048828125, -1.5322265625, -1.3094482421875, -1.086669921875, -0.8638916015625, -0.64111328125, -0.4183349609375, -0.195556640625, 0.0272216796875, 0.25, 0.4727783203125, 0.695556640625, 0.9183349609375, 1.14111328125, 1.3638916015625, 1.586669921875, 1.8094482421875, 2.0322265625, 2.2550048828125, 2.477783203125, 2.7005615234375, 2.92333984375, 3.1461181640625, 3.368896484375, 3.5916748046875, 3.814453125, 4.0372314453125, 4.260009765625, 4.4827880859375, 4.70556640625, 4.9283447265625, 5.151123046875, 5.3739013671875, 5.5966796875, 5.8194580078125, 6.042236328125, 6.2650146484375, 6.48779296875, 6.7105712890625, 6.933349609375, 7.1561279296875, 7.37890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 10.0, 57.0, 165.0, 435.0, 245.0, 59.0, 26.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.42633056640625, -113.62159729003906, -107.8168716430664, -102.01214599609375, -96.20741271972656, -90.40267944335938, -84.59795379638672, -78.79322814941406, -72.98849487304688, -67.18376159667969, -61.37903594970703, -55.57430648803711, -49.76957702636719, -43.964847564697266, -38.160118103027344, -32.35538864135742, -26.5506591796875, -20.745929718017578, -14.941200256347656, -9.136470794677734, -3.3317413330078125, 2.4729881286621094, 8.277717590332031, 14.082447052001953, 19.887176513671875, 25.691905975341797, 31.49663543701172, 37.30136489868164, 43.10609436035156, 48.910823822021484, 54.715553283691406, 60.52028274536133, 66.32501220703125, 72.12974548339844, 77.9344711303711, 83.73919677734375, 89.54393005371094, 95.34866333007812, 101.15338897705078, 106.95811462402344, 112.76284790039062, 118.56758117675781, 124.37230682373047, 130.17703247070312, 135.9817657470703, 141.7864990234375, 147.59121704101562, 153.3959503173828, 159.20068359375, 165.0054168701172, 170.81015014648438, 176.6148681640625, 182.4196014404297, 188.22433471679688, 194.029052734375, 199.8337860107422, 205.63851928710938, 211.44325256347656, 217.24798583984375, 223.05270385742188, 228.85743713378906, 234.66217041015625, 240.46688842773438, 246.27162170410156, 252.07635498046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 4.0, 12.0, 10.0, 8.0, 14.0, 20.0, 20.0, 30.0, 17.0, 32.0, 34.0, 30.0, 48.0, 32.0, 40.0, 39.0, 41.0, 44.0, 46.0, 46.0, 57.0, 38.0, 37.0, 44.0, 27.0, 29.0, 21.0, 25.0, 20.0, 26.0, 16.0, 12.0, 11.0, 11.0, 6.0, 8.0, 7.0, 7.0, 3.0, 1.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.201194763183594, -28.271142959594727, -27.341093063354492, -26.411041259765625, -25.48099136352539, -24.550939559936523, -23.620887756347656, -22.690837860107422, -21.760786056518555, -20.830734252929688, -19.900684356689453, -18.970632553100586, -18.04058265686035, -17.110530853271484, -16.18048095703125, -15.250429153442383, -14.320378303527832, -13.390327453613281, -12.46027660369873, -11.53022575378418, -10.600173950195312, -9.670123100280762, -8.740072250366211, -7.810020923614502, -6.879970073699951, -5.9499192237854, -5.019867897033691, -4.089817047119141, -3.1597659587860107, -2.229714870452881, -1.29966402053833, -0.3696126937866211, 0.5604381561279297, 1.4904892444610596, 2.4205403327941895, 3.3505911827087402, 4.280642509460449, 5.210693359375, 6.140744209289551, 7.07079553604126, 8.000846862792969, 8.93089771270752, 9.86094856262207, 10.791000366210938, 11.721051216125488, 12.651102066040039, 13.58115291595459, 14.51120376586914, 15.441254615783691, 16.371305465698242, 17.30135726928711, 18.231407165527344, 19.16145896911621, 20.091510772705078, 21.021560668945312, 21.95161247253418, 22.881662368774414, 23.81171417236328, 24.741764068603516, 25.671815872192383, 26.601865768432617, 27.531917572021484, 28.46196746826172, 29.392019271850586, 30.322071075439453]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 8.0, 7.0, 20.0, 26.0, 38.0, 45.0, 65.0, 66.0, 145.0, 177.0, 287.0, 426.0, 751.0, 1288.0, 2498.0, 5222.0, 11632.0, 29347.0, 78833.0, 214369.0, 380425.0, 200658.0, 73100.0, 27686.0, 10978.0, 4843.0, 2388.0, 1248.0, 673.0, 399.0, 288.0, 189.0, 113.0, 94.0, 68.0, 47.0, 33.0, 24.0, 16.0, 17.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.3125, -32.345947265625, -31.37939453125, -30.412841796875, -29.4462890625, -28.479736328125, -27.51318359375, -26.546630859375, -25.580078125, -24.613525390625, -23.64697265625, -22.680419921875, -21.7138671875, -20.747314453125, -19.78076171875, -18.814208984375, -17.84765625, -16.881103515625, -15.91455078125, -14.947998046875, -13.9814453125, -13.014892578125, -12.04833984375, -11.081787109375, -10.115234375, -9.148681640625, -8.18212890625, -7.215576171875, -6.2490234375, -5.282470703125, -4.31591796875, -3.349365234375, -2.3828125, -1.416259765625, -0.44970703125, 0.516845703125, 1.4833984375, 2.449951171875, 3.41650390625, 4.383056640625, 5.349609375, 6.316162109375, 7.28271484375, 8.249267578125, 9.2158203125, 10.182373046875, 11.14892578125, 12.115478515625, 13.08203125, 14.048583984375, 15.01513671875, 15.981689453125, 16.9482421875, 17.914794921875, 18.88134765625, 19.847900390625, 20.814453125, 21.781005859375, 22.74755859375, 23.714111328125, 24.6806640625, 25.647216796875, 26.61376953125, 27.580322265625, 28.546875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 9.0, 16.0, 24.0, 28.0, 42.0, 47.0, 68.0, 69.0, 89.0, 85.0, 84.0, 76.0, 76.0, 62.0, 56.0, 33.0, 30.0, 27.0, 21.0, 13.0, 14.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.0909423828125, -2.963134765625, -2.8353271484375, -2.70751953125, -2.5797119140625, -2.451904296875, -2.3240966796875, -2.1962890625, -2.0684814453125, -1.940673828125, -1.8128662109375, -1.68505859375, -1.5572509765625, -1.429443359375, -1.3016357421875, -1.173828125, -1.0460205078125, -0.918212890625, -0.7904052734375, -0.66259765625, -0.5347900390625, -0.406982421875, -0.2791748046875, -0.1513671875, -0.0235595703125, 0.104248046875, 0.2320556640625, 0.35986328125, 0.4876708984375, 0.615478515625, 0.7432861328125, 0.87109375, 0.9989013671875, 1.126708984375, 1.2545166015625, 1.38232421875, 1.5101318359375, 1.637939453125, 1.7657470703125, 1.8935546875, 2.0213623046875, 2.149169921875, 2.2769775390625, 2.40478515625, 2.5325927734375, 2.660400390625, 2.7882080078125, 2.916015625, 3.0438232421875, 3.171630859375, 3.2994384765625, 3.42724609375, 3.5550537109375, 3.682861328125, 3.8106689453125, 3.9384765625, 4.0662841796875, 4.194091796875, 4.3218994140625, 4.44970703125, 4.5775146484375, 4.705322265625, 4.8331298828125, 4.9609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 10.0, 9.0, 12.0, 14.0, 13.0, 26.0, 27.0, 43.0, 49.0, 83.0, 110.0, 168.0, 337.0, 539.0, 1127.0, 2530.0, 6620.0, 20189.0, 69282.0, 261674.0, 460632.0, 160004.0, 43250.0, 13289.0, 4673.0, 1840.0, 813.0, 456.0, 251.0, 126.0, 115.0, 68.0, 48.0, 34.0, 33.0, 17.0, 15.0, 5.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.71875, -36.474609375, -35.23046875, -33.986328125, -32.7421875, -31.498046875, -30.25390625, -29.009765625, -27.765625, -26.521484375, -25.27734375, -24.033203125, -22.7890625, -21.544921875, -20.30078125, -19.056640625, -17.8125, -16.568359375, -15.32421875, -14.080078125, -12.8359375, -11.591796875, -10.34765625, -9.103515625, -7.859375, -6.615234375, -5.37109375, -4.126953125, -2.8828125, -1.638671875, -0.39453125, 0.849609375, 2.09375, 3.337890625, 4.58203125, 5.826171875, 7.0703125, 8.314453125, 9.55859375, 10.802734375, 12.046875, 13.291015625, 14.53515625, 15.779296875, 17.0234375, 18.267578125, 19.51171875, 20.755859375, 22.0, 23.244140625, 24.48828125, 25.732421875, 26.9765625, 28.220703125, 29.46484375, 30.708984375, 31.953125, 33.197265625, 34.44140625, 35.685546875, 36.9296875, 38.173828125, 39.41796875, 40.662109375, 41.90625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 2.0, 7.0, 14.0, 13.0, 19.0, 16.0, 23.0, 29.0, 31.0, 33.0, 35.0, 45.0, 43.0, 62.0, 46.0, 54.0, 54.0, 51.0, 47.0, 58.0, 44.0, 33.0, 29.0, 33.0, 29.0, 26.0, 28.0, 16.0, 16.0, 10.0, 15.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.212158203125, -15.64306640625, -15.073974609375, -14.5048828125, -13.935791015625, -13.36669921875, -12.797607421875, -12.228515625, -11.659423828125, -11.09033203125, -10.521240234375, -9.9521484375, -9.383056640625, -8.81396484375, -8.244873046875, -7.67578125, -7.106689453125, -6.53759765625, -5.968505859375, -5.3994140625, -4.830322265625, -4.26123046875, -3.692138671875, -3.123046875, -2.553955078125, -1.98486328125, -1.415771484375, -0.8466796875, -0.277587890625, 0.29150390625, 0.860595703125, 1.4296875, 1.998779296875, 2.56787109375, 3.136962890625, 3.7060546875, 4.275146484375, 4.84423828125, 5.413330078125, 5.982421875, 6.551513671875, 7.12060546875, 7.689697265625, 8.2587890625, 8.827880859375, 9.39697265625, 9.966064453125, 10.53515625, 11.104248046875, 11.67333984375, 12.242431640625, 12.8115234375, 13.380615234375, 13.94970703125, 14.518798828125, 15.087890625, 15.656982421875, 16.22607421875, 16.795166015625, 17.3642578125, 17.933349609375, 18.50244140625, 19.071533203125, 19.640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 10.0, 22.0, 32.0, 43.0, 55.0, 107.0, 160.0, 317.0, 571.0, 1063.0, 2157.0, 4607.0, 10536.0, 27540.0, 83744.0, 298168.0, 417497.0, 134721.0, 40548.0, 14606.0, 6097.0, 2784.0, 1325.0, 712.0, 411.0, 220.0, 157.0, 102.0, 56.0, 37.0, 25.0, 23.0, 21.0, 17.0, 4.0, 8.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-22.984375, -22.270263671875, -21.55615234375, -20.842041015625, -20.1279296875, -19.413818359375, -18.69970703125, -17.985595703125, -17.271484375, -16.557373046875, -15.84326171875, -15.129150390625, -14.4150390625, -13.700927734375, -12.98681640625, -12.272705078125, -11.55859375, -10.844482421875, -10.13037109375, -9.416259765625, -8.7021484375, -7.988037109375, -7.27392578125, -6.559814453125, -5.845703125, -5.131591796875, -4.41748046875, -3.703369140625, -2.9892578125, -2.275146484375, -1.56103515625, -0.846923828125, -0.1328125, 0.581298828125, 1.29541015625, 2.009521484375, 2.7236328125, 3.437744140625, 4.15185546875, 4.865966796875, 5.580078125, 6.294189453125, 7.00830078125, 7.722412109375, 8.4365234375, 9.150634765625, 9.86474609375, 10.578857421875, 11.29296875, 12.007080078125, 12.72119140625, 13.435302734375, 14.1494140625, 14.863525390625, 15.57763671875, 16.291748046875, 17.005859375, 17.719970703125, 18.43408203125, 19.148193359375, 19.8623046875, 20.576416015625, 21.29052734375, 22.004638671875, 22.71875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 8.0, 11.0, 12.0, 12.0, 20.0, 37.0, 50.0, 56.0, 65.0, 103.0, 94.0, 122.0, 84.0, 84.0, 69.0, 33.0, 32.0, 36.0, 19.0, 13.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042266845703125, -0.0040991902351379395, -0.003971695899963379, -0.0038442015647888184, -0.003716707229614258, -0.0035892128944396973, -0.0034617185592651367, -0.003334224224090576, -0.0032067298889160156, -0.003079235553741455, -0.0029517412185668945, -0.002824246883392334, -0.0026967525482177734, -0.002569258213043213, -0.0024417638778686523, -0.002314269542694092, -0.0021867752075195312, -0.0020592808723449707, -0.0019317865371704102, -0.0018042922019958496, -0.001676797866821289, -0.0015493035316467285, -0.001421809196472168, -0.0012943148612976074, -0.0011668205261230469, -0.0010393261909484863, -0.0009118318557739258, -0.0007843375205993652, -0.0006568431854248047, -0.0005293488502502441, -0.0004018545150756836, -0.00027436017990112305, -0.0001468658447265625, -1.9371509552001953e-05, 0.0001081228256225586, 0.00023561716079711914, 0.0003631114959716797, 0.0004906058311462402, 0.0006181001663208008, 0.0007455945014953613, 0.0008730888366699219, 0.0010005831718444824, 0.001128077507019043, 0.0012555718421936035, 0.001383066177368164, 0.0015105605125427246, 0.0016380548477172852, 0.0017655491828918457, 0.0018930435180664062, 0.002020537853240967, 0.0021480321884155273, 0.002275526523590088, 0.0024030208587646484, 0.002530515193939209, 0.0026580095291137695, 0.00278550386428833, 0.0029129981994628906, 0.003040492534637451, 0.0031679868698120117, 0.0032954812049865723, 0.003422975540161133, 0.0035504698753356934, 0.003677964210510254, 0.0038054585456848145, 0.003932952880859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 3.0, 3.0, 8.0, 8.0, 9.0, 14.0, 23.0, 41.0, 71.0, 115.0, 233.0, 484.0, 973.0, 2617.0, 8691.0, 39710.0, 344976.0, 570037.0, 62339.0, 12252.0, 3512.0, 1293.0, 539.0, 253.0, 117.0, 92.0, 46.0, 31.0, 16.0, 17.0, 11.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-51.96875, -50.56884765625, -49.1689453125, -47.76904296875, -46.369140625, -44.96923828125, -43.5693359375, -42.16943359375, -40.76953125, -39.36962890625, -37.9697265625, -36.56982421875, -35.169921875, -33.77001953125, -32.3701171875, -30.97021484375, -29.5703125, -28.17041015625, -26.7705078125, -25.37060546875, -23.970703125, -22.57080078125, -21.1708984375, -19.77099609375, -18.37109375, -16.97119140625, -15.5712890625, -14.17138671875, -12.771484375, -11.37158203125, -9.9716796875, -8.57177734375, -7.171875, -5.77197265625, -4.3720703125, -2.97216796875, -1.572265625, -0.17236328125, 1.2275390625, 2.62744140625, 4.02734375, 5.42724609375, 6.8271484375, 8.22705078125, 9.626953125, 11.02685546875, 12.4267578125, 13.82666015625, 15.2265625, 16.62646484375, 18.0263671875, 19.42626953125, 20.826171875, 22.22607421875, 23.6259765625, 25.02587890625, 26.42578125, 27.82568359375, 29.2255859375, 30.62548828125, 32.025390625, 33.42529296875, 34.8251953125, 36.22509765625, 37.625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 13.0, 9.0, 13.0, 20.0, 16.0, 25.0, 51.0, 49.0, 73.0, 88.0, 118.0, 107.0, 103.0, 82.0, 63.0, 37.0, 26.0, 19.0, 21.0, 17.0, 9.0, 7.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.96875, -19.4305419921875, -18.892333984375, -18.3541259765625, -17.81591796875, -17.2777099609375, -16.739501953125, -16.2012939453125, -15.6630859375, -15.1248779296875, -14.586669921875, -14.0484619140625, -13.51025390625, -12.9720458984375, -12.433837890625, -11.8956298828125, -11.357421875, -10.8192138671875, -10.281005859375, -9.7427978515625, -9.20458984375, -8.6663818359375, -8.128173828125, -7.5899658203125, -7.0517578125, -6.5135498046875, -5.975341796875, -5.4371337890625, -4.89892578125, -4.3607177734375, -3.822509765625, -3.2843017578125, -2.74609375, -2.2078857421875, -1.669677734375, -1.1314697265625, -0.59326171875, -0.0550537109375, 0.483154296875, 1.0213623046875, 1.5595703125, 2.0977783203125, 2.635986328125, 3.1741943359375, 3.71240234375, 4.2506103515625, 4.788818359375, 5.3270263671875, 5.865234375, 6.4034423828125, 6.941650390625, 7.4798583984375, 8.01806640625, 8.5562744140625, 9.094482421875, 9.6326904296875, 10.1708984375, 10.7091064453125, 11.247314453125, 11.7855224609375, 12.32373046875, 12.8619384765625, 13.400146484375, 13.9383544921875, 14.4765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 12.0, 26.0, 62.0, 104.0, 183.0, 223.0, 169.0, 110.0, 54.0, 18.0, 12.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-378.73016357421875, -367.71539306640625, -356.70062255859375, -345.6858215332031, -334.6710510253906, -323.6562805175781, -312.6414794921875, -301.626708984375, -290.6119384765625, -279.59716796875, -268.5823974609375, -257.5675964355469, -246.55282592773438, -235.53805541992188, -224.5232696533203, -213.50848388671875, -202.49371337890625, -191.47894287109375, -180.4641571044922, -169.44937133789062, -158.43460083007812, -147.41983032226562, -136.40504455566406, -125.39026641845703, -114.37548828125, -103.36071014404297, -92.34593200683594, -81.3311538696289, -70.31637573242188, -59.301597595214844, -48.28681945800781, -37.27204132080078, -26.257232666015625, -15.242454528808594, -4.2276763916015625, 6.787101745605469, 17.8018798828125, 28.81665802001953, 39.83143615722656, 50.846214294433594, 61.860992431640625, 72.87577056884766, 83.89054870605469, 94.90532684326172, 105.92010498046875, 116.93488311767578, 127.94966125488281, 138.96444702148438, 149.97921752929688, 160.99398803710938, 172.00877380371094, 183.0235595703125, 194.038330078125, 205.0531005859375, 216.06788635253906, 227.08267211914062, 238.09744262695312, 249.11221313476562, 260.12701416015625, 271.14178466796875, 282.15655517578125, 293.17132568359375, 304.18609619140625, 315.2008972167969, 326.2156677246094]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 11.0, 12.0, 18.0, 19.0, 25.0, 18.0, 15.0, 31.0, 28.0, 49.0, 49.0, 43.0, 56.0, 26.0, 47.0, 54.0, 41.0, 50.0, 34.0, 45.0, 39.0, 38.0, 43.0, 29.0, 22.0, 26.0, 20.0, 11.0, 16.0, 10.0, 9.0, 8.0, 8.0, 8.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-133.895263671875, -130.08030700683594, -126.2653579711914, -122.45040130615234, -118.63545227050781, -114.82049560546875, -111.00553894042969, -107.19058990478516, -103.37564086914062, -99.56068420410156, -95.74573516845703, -91.93077850341797, -88.11582946777344, -84.30087280273438, -80.48591613769531, -76.67096710205078, -72.85601043701172, -69.04105377197266, -65.22610473632812, -61.41114807128906, -57.59619903564453, -53.78124237060547, -49.96628952026367, -46.151336669921875, -42.33638381958008, -38.52143096923828, -34.706478118896484, -30.891523361206055, -27.076570510864258, -23.26161766052246, -19.44666290283203, -15.631710052490234, -11.816764831542969, -8.001811981201172, -4.186858177185059, -0.3719043731689453, 3.4430484771728516, 7.258001327514648, 11.072956085205078, 14.887908935546875, 18.702861785888672, 22.51781463623047, 26.332767486572266, 30.147722244262695, 33.962677001953125, 37.777626037597656, 41.59258270263672, 45.407535552978516, 49.22248840332031, 53.03744125366211, 56.852394104003906, 60.66735076904297, 64.4822998046875, 68.29725646972656, 72.11221313476562, 75.92716217041016, 79.74211120605469, 83.55706787109375, 87.37201690673828, 91.18697357177734, 95.00192260742188, 98.81687927246094, 102.6318359375, 106.44678497314453, 110.2617416381836]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 5.0, 9.0, 15.0, 21.0, 20.0, 30.0, 46.0, 62.0, 78.0, 121.0, 172.0, 243.0, 390.0, 638.0, 1051.0, 1938.0, 3712.0, 8289.0, 21419.0, 68032.0, 337218.0, 3383230.0, 270800.0, 61660.0, 20071.0, 7884.0, 3433.0, 1649.0, 860.0, 440.0, 272.0, 165.0, 99.0, 60.0, 35.0, 36.0, 22.0, 22.0, 17.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.375, -53.71923828125, -52.0634765625, -50.40771484375, -48.751953125, -47.09619140625, -45.4404296875, -43.78466796875, -42.12890625, -40.47314453125, -38.8173828125, -37.16162109375, -35.505859375, -33.85009765625, -32.1943359375, -30.53857421875, -28.8828125, -27.22705078125, -25.5712890625, -23.91552734375, -22.259765625, -20.60400390625, -18.9482421875, -17.29248046875, -15.63671875, -13.98095703125, -12.3251953125, -10.66943359375, -9.013671875, -7.35791015625, -5.7021484375, -4.04638671875, -2.390625, -0.73486328125, 0.9208984375, 2.57666015625, 4.232421875, 5.88818359375, 7.5439453125, 9.19970703125, 10.85546875, 12.51123046875, 14.1669921875, 15.82275390625, 17.478515625, 19.13427734375, 20.7900390625, 22.44580078125, 24.1015625, 25.75732421875, 27.4130859375, 29.06884765625, 30.724609375, 32.38037109375, 34.0361328125, 35.69189453125, 37.34765625, 39.00341796875, 40.6591796875, 42.31494140625, 43.970703125, 45.62646484375, 47.2822265625, 48.93798828125, 50.59375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 4.0, 8.0, 16.0, 19.0, 27.0, 36.0, 43.0, 46.0, 60.0, 69.0, 78.0, 63.0, 73.0, 69.0, 77.0, 60.0, 42.0, 45.0, 32.0, 29.0, 29.0, 12.0, 16.0, 9.0, 12.0, 2.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.77362060546875, -3.6292724609375, -3.48492431640625, -3.340576171875, -3.19622802734375, -3.0518798828125, -2.90753173828125, -2.76318359375, -2.61883544921875, -2.4744873046875, -2.33013916015625, -2.185791015625, -2.04144287109375, -1.8970947265625, -1.75274658203125, -1.6083984375, -1.46405029296875, -1.3197021484375, -1.17535400390625, -1.031005859375, -0.88665771484375, -0.7423095703125, -0.59796142578125, -0.45361328125, -0.30926513671875, -0.1649169921875, -0.02056884765625, 0.123779296875, 0.26812744140625, 0.4124755859375, 0.55682373046875, 0.701171875, 0.84552001953125, 0.9898681640625, 1.13421630859375, 1.278564453125, 1.42291259765625, 1.5672607421875, 1.71160888671875, 1.85595703125, 2.00030517578125, 2.1446533203125, 2.28900146484375, 2.433349609375, 2.57769775390625, 2.7220458984375, 2.86639404296875, 3.0107421875, 3.15509033203125, 3.2994384765625, 3.44378662109375, 3.588134765625, 3.73248291015625, 3.8768310546875, 4.02117919921875, 4.16552734375, 4.30987548828125, 4.4542236328125, 4.59857177734375, 4.742919921875, 4.88726806640625, 5.0316162109375, 5.17596435546875, 5.3203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 20.0, 15.0, 22.0, 53.0, 69.0, 130.0, 194.0, 337.0, 571.0, 1116.0, 2436.0, 5544.0, 14333.0, 43011.0, 168149.0, 2431916.0, 1315696.0, 148499.0, 39227.0, 13306.0, 5190.0, 2216.0, 1005.0, 516.0, 289.0, 153.0, 97.0, 40.0, 37.0, 21.0, 21.0, 14.0, 11.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.759765625, -45.98828125, -44.216796875, -42.4453125, -40.673828125, -38.90234375, -37.130859375, -35.359375, -33.587890625, -31.81640625, -30.044921875, -28.2734375, -26.501953125, -24.73046875, -22.958984375, -21.1875, -19.416015625, -17.64453125, -15.873046875, -14.1015625, -12.330078125, -10.55859375, -8.787109375, -7.015625, -5.244140625, -3.47265625, -1.701171875, 0.0703125, 1.841796875, 3.61328125, 5.384765625, 7.15625, 8.927734375, 10.69921875, 12.470703125, 14.2421875, 16.013671875, 17.78515625, 19.556640625, 21.328125, 23.099609375, 24.87109375, 26.642578125, 28.4140625, 30.185546875, 31.95703125, 33.728515625, 35.5, 37.271484375, 39.04296875, 40.814453125, 42.5859375, 44.357421875, 46.12890625, 47.900390625, 49.671875, 51.443359375, 53.21484375, 54.986328125, 56.7578125, 58.529296875, 60.30078125, 62.072265625, 63.84375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 17.0, 10.0, 23.0, 25.0, 39.0, 49.0, 53.0, 70.0, 133.0, 151.0, 267.0, 463.0, 1434.0, 448.0, 259.0, 169.0, 110.0, 80.0, 60.0, 44.0, 37.0, 28.0, 20.0, 14.0, 13.0, 16.0, 6.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.75, -12.40087890625, -12.0517578125, -11.70263671875, -11.353515625, -11.00439453125, -10.6552734375, -10.30615234375, -9.95703125, -9.60791015625, -9.2587890625, -8.90966796875, -8.560546875, -8.21142578125, -7.8623046875, -7.51318359375, -7.1640625, -6.81494140625, -6.4658203125, -6.11669921875, -5.767578125, -5.41845703125, -5.0693359375, -4.72021484375, -4.37109375, -4.02197265625, -3.6728515625, -3.32373046875, -2.974609375, -2.62548828125, -2.2763671875, -1.92724609375, -1.578125, -1.22900390625, -0.8798828125, -0.53076171875, -0.181640625, 0.16748046875, 0.5166015625, 0.86572265625, 1.21484375, 1.56396484375, 1.9130859375, 2.26220703125, 2.611328125, 2.96044921875, 3.3095703125, 3.65869140625, 4.0078125, 4.35693359375, 4.7060546875, 5.05517578125, 5.404296875, 5.75341796875, 6.1025390625, 6.45166015625, 6.80078125, 7.14990234375, 7.4990234375, 7.84814453125, 8.197265625, 8.54638671875, 8.8955078125, 9.24462890625, 9.59375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 8.0, 14.0, 10.0, 17.0, 23.0, 30.0, 46.0, 50.0, 69.0, 87.0, 106.0, 101.0, 90.0, 82.0, 63.0, 45.0, 35.0, 32.0, 20.0, 16.0, 12.0, 4.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-57.18735885620117, -55.36600112915039, -53.54464340209961, -51.72328186035156, -49.90192413330078, -48.08056640625, -46.25920867919922, -44.43785095214844, -42.61648941040039, -40.79513168334961, -38.97377395629883, -37.15241241455078, -35.3310546875, -33.50969696044922, -31.688339233398438, -29.866979598999023, -28.045621871948242, -26.22426414489746, -24.402904510498047, -22.581546783447266, -20.76018714904785, -18.93882942199707, -17.117469787597656, -15.296112060546875, -13.474753379821777, -11.65339469909668, -9.832036018371582, -8.010677337646484, -6.189319133758545, -4.3679609298706055, -2.546602249145508, -0.7252435684204102, 1.0961151123046875, 2.917473793029785, 4.738832473754883, 6.560190677642822, 8.381549835205078, 10.20290756225586, 12.024266242980957, 13.845624923706055, 15.666983604431152, 17.48834228515625, 19.30970001220703, 21.131059646606445, 22.952417373657227, 24.77377700805664, 26.595134735107422, 28.416492462158203, 30.237852096557617, 32.05921173095703, 33.88056945800781, 35.701927185058594, 37.523284912109375, 39.344642639160156, 41.1660041809082, 42.987361907958984, 44.808719635009766, 46.63007736206055, 48.45143508911133, 50.272796630859375, 52.094154357910156, 53.91551208496094, 55.73686981201172, 57.5582275390625, 59.37958908081055]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 11.0, 9.0, 8.0, 18.0, 11.0, 18.0, 25.0, 23.0, 31.0, 26.0, 30.0, 42.0, 32.0, 31.0, 50.0, 49.0, 42.0, 41.0, 57.0, 41.0, 50.0, 33.0, 38.0, 31.0, 29.0, 27.0, 29.0, 26.0, 26.0, 19.0, 16.0, 7.0, 12.0, 9.0, 6.0, 7.0, 11.0, 1.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-43.58074951171875, -42.231414794921875, -40.882076263427734, -39.53274154663086, -38.183406829833984, -36.83407211303711, -35.48473358154297, -34.135398864746094, -32.78606414794922, -31.43672752380371, -30.087392807006836, -28.738056182861328, -27.388721466064453, -26.039384841918945, -24.690048217773438, -23.340713500976562, -21.991376876831055, -20.642040252685547, -19.292705535888672, -17.943368911743164, -16.59403419494629, -15.244697570800781, -13.89536190032959, -12.546026229858398, -11.196690559387207, -9.847354888916016, -8.498019218444824, -7.148683071136475, -5.799347400665283, -4.450011730194092, -3.100675582885742, -1.7513399124145508, -0.4020042419433594, 0.9473315477371216, 2.2966673374176025, 3.646003246307373, 4.9953389167785645, 6.344674587249756, 7.6940107345581055, 9.043346405029297, 10.392682075500488, 11.74201774597168, 13.091353416442871, 14.440689086914062, 15.79002571105957, 17.139360427856445, 18.488697052001953, 19.838031768798828, 21.187368392944336, 22.536705017089844, 23.88603973388672, 25.235376358032227, 26.5847110748291, 27.93404769897461, 29.283382415771484, 30.632719039916992, 31.9820556640625, 33.331390380859375, 34.680728912353516, 36.03006362915039, 37.379398345947266, 38.72873306274414, 40.07807159423828, 41.427406311035156, 42.77674102783203]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 7.0, 7.0, 6.0, 8.0, 16.0, 18.0, 30.0, 41.0, 74.0, 77.0, 112.0, 186.0, 244.0, 361.0, 526.0, 871.0, 1405.0, 2308.0, 4192.0, 7831.0, 15966.0, 33910.0, 74963.0, 165963.0, 303664.0, 232084.0, 108473.0, 48541.0, 22378.0, 10713.0, 5633.0, 3095.0, 1709.0, 1052.0, 688.0, 434.0, 306.0, 206.0, 147.0, 91.0, 67.0, 48.0, 30.0, 17.0, 20.0, 10.0, 8.0, 3.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-25.3125, -24.48876953125, -23.6650390625, -22.84130859375, -22.017578125, -21.19384765625, -20.3701171875, -19.54638671875, -18.72265625, -17.89892578125, -17.0751953125, -16.25146484375, -15.427734375, -14.60400390625, -13.7802734375, -12.95654296875, -12.1328125, -11.30908203125, -10.4853515625, -9.66162109375, -8.837890625, -8.01416015625, -7.1904296875, -6.36669921875, -5.54296875, -4.71923828125, -3.8955078125, -3.07177734375, -2.248046875, -1.42431640625, -0.6005859375, 0.22314453125, 1.046875, 1.87060546875, 2.6943359375, 3.51806640625, 4.341796875, 5.16552734375, 5.9892578125, 6.81298828125, 7.63671875, 8.46044921875, 9.2841796875, 10.10791015625, 10.931640625, 11.75537109375, 12.5791015625, 13.40283203125, 14.2265625, 15.05029296875, 15.8740234375, 16.69775390625, 17.521484375, 18.34521484375, 19.1689453125, 19.99267578125, 20.81640625, 21.64013671875, 22.4638671875, 23.28759765625, 24.111328125, 24.93505859375, 25.7587890625, 26.58251953125, 27.40625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 11.0, 15.0, 19.0, 24.0, 29.0, 34.0, 45.0, 55.0, 48.0, 56.0, 69.0, 69.0, 53.0, 64.0, 59.0, 56.0, 51.0, 43.0, 37.0, 41.0, 25.0, 18.0, 6.0, 13.0, 6.0, 10.0, 4.0, 6.0, 1.0, 8.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -4.009521484375, -3.86669921875, -3.723876953125, -3.5810546875, -3.438232421875, -3.29541015625, -3.152587890625, -3.009765625, -2.866943359375, -2.72412109375, -2.581298828125, -2.4384765625, -2.295654296875, -2.15283203125, -2.010009765625, -1.8671875, -1.724365234375, -1.58154296875, -1.438720703125, -1.2958984375, -1.153076171875, -1.01025390625, -0.867431640625, -0.724609375, -0.581787109375, -0.43896484375, -0.296142578125, -0.1533203125, -0.010498046875, 0.13232421875, 0.275146484375, 0.41796875, 0.560791015625, 0.70361328125, 0.846435546875, 0.9892578125, 1.132080078125, 1.27490234375, 1.417724609375, 1.560546875, 1.703369140625, 1.84619140625, 1.989013671875, 2.1318359375, 2.274658203125, 2.41748046875, 2.560302734375, 2.703125, 2.845947265625, 2.98876953125, 3.131591796875, 3.2744140625, 3.417236328125, 3.56005859375, 3.702880859375, 3.845703125, 3.988525390625, 4.13134765625, 4.274169921875, 4.4169921875, 4.559814453125, 4.70263671875, 4.845458984375, 4.98828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 4.0, 16.0, 24.0, 34.0, 50.0, 79.0, 107.0, 187.0, 325.0, 650.0, 1482.0, 3650.0, 10869.0, 38739.0, 164795.0, 548171.0, 210809.0, 48292.0, 12950.0, 4138.0, 1643.0, 704.0, 325.0, 193.0, 95.0, 66.0, 46.0, 37.0, 19.0, 14.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.53125, -46.8330078125, -45.134765625, -43.4365234375, -41.73828125, -40.0400390625, -38.341796875, -36.6435546875, -34.9453125, -33.2470703125, -31.548828125, -29.8505859375, -28.15234375, -26.4541015625, -24.755859375, -23.0576171875, -21.359375, -19.6611328125, -17.962890625, -16.2646484375, -14.56640625, -12.8681640625, -11.169921875, -9.4716796875, -7.7734375, -6.0751953125, -4.376953125, -2.6787109375, -0.98046875, 0.7177734375, 2.416015625, 4.1142578125, 5.8125, 7.5107421875, 9.208984375, 10.9072265625, 12.60546875, 14.3037109375, 16.001953125, 17.7001953125, 19.3984375, 21.0966796875, 22.794921875, 24.4931640625, 26.19140625, 27.8896484375, 29.587890625, 31.2861328125, 32.984375, 34.6826171875, 36.380859375, 38.0791015625, 39.77734375, 41.4755859375, 43.173828125, 44.8720703125, 46.5703125, 48.2685546875, 49.966796875, 51.6650390625, 53.36328125, 55.0615234375, 56.759765625, 58.4580078125, 60.15625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 1.0, 5.0, 4.0, 11.0, 12.0, 5.0, 9.0, 13.0, 17.0, 22.0, 30.0, 35.0, 29.0, 32.0, 51.0, 50.0, 51.0, 44.0, 52.0, 52.0, 57.0, 37.0, 44.0, 37.0, 52.0, 39.0, 40.0, 33.0, 28.0, 25.0, 22.0, 15.0, 12.0, 6.0, 7.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.413330078125, -22.59228515625, -21.771240234375, -20.9501953125, -20.129150390625, -19.30810546875, -18.487060546875, -17.666015625, -16.844970703125, -16.02392578125, -15.202880859375, -14.3818359375, -13.560791015625, -12.73974609375, -11.918701171875, -11.09765625, -10.276611328125, -9.45556640625, -8.634521484375, -7.8134765625, -6.992431640625, -6.17138671875, -5.350341796875, -4.529296875, -3.708251953125, -2.88720703125, -2.066162109375, -1.2451171875, -0.424072265625, 0.39697265625, 1.218017578125, 2.0390625, 2.860107421875, 3.68115234375, 4.502197265625, 5.3232421875, 6.144287109375, 6.96533203125, 7.786376953125, 8.607421875, 9.428466796875, 10.24951171875, 11.070556640625, 11.8916015625, 12.712646484375, 13.53369140625, 14.354736328125, 15.17578125, 15.996826171875, 16.81787109375, 17.638916015625, 18.4599609375, 19.281005859375, 20.10205078125, 20.923095703125, 21.744140625, 22.565185546875, 23.38623046875, 24.207275390625, 25.0283203125, 25.849365234375, 26.67041015625, 27.491455078125, 28.3125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 1.0, 9.0, 8.0, 8.0, 20.0, 21.0, 30.0, 32.0, 70.0, 98.0, 139.0, 191.0, 375.0, 643.0, 1124.0, 2156.0, 4285.0, 9301.0, 21238.0, 54844.0, 153291.0, 385568.0, 262777.0, 91129.0, 34354.0, 13880.0, 6261.0, 3007.0, 1503.0, 876.0, 496.0, 277.0, 189.0, 123.0, 74.0, 42.0, 35.0, 27.0, 13.0, 15.0, 4.0, 11.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.63037109375, -16.9951171875, -16.35986328125, -15.724609375, -15.08935546875, -14.4541015625, -13.81884765625, -13.18359375, -12.54833984375, -11.9130859375, -11.27783203125, -10.642578125, -10.00732421875, -9.3720703125, -8.73681640625, -8.1015625, -7.46630859375, -6.8310546875, -6.19580078125, -5.560546875, -4.92529296875, -4.2900390625, -3.65478515625, -3.01953125, -2.38427734375, -1.7490234375, -1.11376953125, -0.478515625, 0.15673828125, 0.7919921875, 1.42724609375, 2.0625, 2.69775390625, 3.3330078125, 3.96826171875, 4.603515625, 5.23876953125, 5.8740234375, 6.50927734375, 7.14453125, 7.77978515625, 8.4150390625, 9.05029296875, 9.685546875, 10.32080078125, 10.9560546875, 11.59130859375, 12.2265625, 12.86181640625, 13.4970703125, 14.13232421875, 14.767578125, 15.40283203125, 16.0380859375, 16.67333984375, 17.30859375, 17.94384765625, 18.5791015625, 19.21435546875, 19.849609375, 20.48486328125, 21.1201171875, 21.75537109375, 22.390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 13.0, 12.0, 17.0, 20.0, 37.0, 54.0, 63.0, 94.0, 155.0, 144.0, 124.0, 77.0, 54.0, 43.0, 29.0, 15.0, 8.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004970550537109375, -0.004788458347320557, -0.004606366157531738, -0.00442427396774292, -0.0042421817779541016, -0.004060089588165283, -0.003877997398376465, -0.0036959052085876465, -0.003513813018798828, -0.0033317208290100098, -0.0031496286392211914, -0.002967536449432373, -0.0027854442596435547, -0.0026033520698547363, -0.002421259880065918, -0.0022391676902770996, -0.0020570755004882812, -0.0018749833106994629, -0.0016928911209106445, -0.0015107989311218262, -0.0013287067413330078, -0.0011466145515441895, -0.0009645223617553711, -0.0007824301719665527, -0.0006003379821777344, -0.000418245792388916, -0.00023615360260009766, -5.40614128112793e-05, 0.00012803077697753906, 0.0003101229667663574, 0.0004922151565551758, 0.0006743073463439941, 0.0008563995361328125, 0.0010384917259216309, 0.0012205839157104492, 0.0014026761054992676, 0.001584768295288086, 0.0017668604850769043, 0.0019489526748657227, 0.002131044864654541, 0.0023131370544433594, 0.0024952292442321777, 0.002677321434020996, 0.0028594136238098145, 0.003041505813598633, 0.003223598003387451, 0.0034056901931762695, 0.003587782382965088, 0.0037698745727539062, 0.003951966762542725, 0.004134058952331543, 0.004316151142120361, 0.00449824333190918, 0.004680335521697998, 0.004862427711486816, 0.005044519901275635, 0.005226612091064453, 0.0054087042808532715, 0.00559079647064209, 0.005772888660430908, 0.0059549808502197266, 0.006137073040008545, 0.006319165229797363, 0.006501257419586182, 0.006683349609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 12.0, 19.0, 20.0, 40.0, 63.0, 109.0, 212.0, 430.0, 937.0, 2331.0, 7297.0, 28229.0, 161314.0, 673197.0, 138323.0, 25301.0, 6720.0, 2243.0, 872.0, 387.0, 193.0, 100.0, 76.0, 44.0, 23.0, 12.0, 10.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.96875, -35.57177734375, -34.1748046875, -32.77783203125, -31.380859375, -29.98388671875, -28.5869140625, -27.18994140625, -25.79296875, -24.39599609375, -22.9990234375, -21.60205078125, -20.205078125, -18.80810546875, -17.4111328125, -16.01416015625, -14.6171875, -13.22021484375, -11.8232421875, -10.42626953125, -9.029296875, -7.63232421875, -6.2353515625, -4.83837890625, -3.44140625, -2.04443359375, -0.6474609375, 0.74951171875, 2.146484375, 3.54345703125, 4.9404296875, 6.33740234375, 7.734375, 9.13134765625, 10.5283203125, 11.92529296875, 13.322265625, 14.71923828125, 16.1162109375, 17.51318359375, 18.91015625, 20.30712890625, 21.7041015625, 23.10107421875, 24.498046875, 25.89501953125, 27.2919921875, 28.68896484375, 30.0859375, 31.48291015625, 32.8798828125, 34.27685546875, 35.673828125, 37.07080078125, 38.4677734375, 39.86474609375, 41.26171875, 42.65869140625, 44.0556640625, 45.45263671875, 46.849609375, 48.24658203125, 49.6435546875, 51.04052734375, 52.4375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 3.0, 9.0, 9.0, 7.0, 8.0, 11.0, 12.0, 22.0, 18.0, 28.0, 31.0, 34.0, 42.0, 50.0, 65.0, 62.0, 79.0, 81.0, 64.0, 75.0, 51.0, 43.0, 35.0, 30.0, 23.0, 10.0, 12.0, 14.0, 11.0, 10.0, 11.0, 11.0, 6.0, 9.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8828125, -14.3878173828125, -13.892822265625, -13.3978271484375, -12.90283203125, -12.4078369140625, -11.912841796875, -11.4178466796875, -10.9228515625, -10.4278564453125, -9.932861328125, -9.4378662109375, -8.94287109375, -8.4478759765625, -7.952880859375, -7.4578857421875, -6.962890625, -6.4678955078125, -5.972900390625, -5.4779052734375, -4.98291015625, -4.4879150390625, -3.992919921875, -3.4979248046875, -3.0029296875, -2.5079345703125, -2.012939453125, -1.5179443359375, -1.02294921875, -0.5279541015625, -0.032958984375, 0.4620361328125, 0.95703125, 1.4520263671875, 1.947021484375, 2.4420166015625, 2.93701171875, 3.4320068359375, 3.927001953125, 4.4219970703125, 4.9169921875, 5.4119873046875, 5.906982421875, 6.4019775390625, 6.89697265625, 7.3919677734375, 7.886962890625, 8.3819580078125, 8.876953125, 9.3719482421875, 9.866943359375, 10.3619384765625, 10.85693359375, 11.3519287109375, 11.846923828125, 12.3419189453125, 12.8369140625, 13.3319091796875, 13.826904296875, 14.3218994140625, 14.81689453125, 15.3118896484375, 15.806884765625, 16.3018798828125, 16.796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 12.0, 18.0, 18.0, 51.0, 68.0, 146.0, 157.0, 182.0, 125.0, 76.0, 62.0, 30.0, 22.0, 8.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.466064453125, -239.61849975585938, -228.77093505859375, -217.92335510253906, -207.07579040527344, -196.2282257080078, -185.38064575195312, -174.5330810546875, -163.68551635742188, -152.83795166015625, -141.99038696289062, -131.14280700683594, -120.29524230957031, -109.44767761230469, -98.60010528564453, -87.75253295898438, -76.90496826171875, -66.05740356445312, -55.20983123779297, -44.36226272583008, -33.51469421386719, -22.667125701904297, -11.819557189941406, -0.97198486328125, 9.875579833984375, 20.723148345947266, 31.570716857910156, 42.41828536987305, 53.26585388183594, 64.11341857910156, 74.96099090576172, 85.80856323242188, 96.65609741210938, 107.503662109375, 118.35123443603516, 129.1988067626953, 140.04637145996094, 150.89393615722656, 161.74151611328125, 172.58908081054688, 183.4366455078125, 194.28421020507812, 205.13177490234375, 215.97935485839844, 226.82691955566406, 237.6744842529297, 248.52206420898438, 259.36962890625, 270.2171936035156, 281.06475830078125, 291.9123229980469, 302.7598876953125, 313.60748291015625, 324.4550476074219, 335.3026123046875, 346.1501770019531, 356.99774169921875, 367.8453063964844, 378.69287109375, 389.5404357910156, 400.38800048828125, 411.235595703125, 422.0831604003906, 432.93072509765625, 443.7782897949219]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 8.0, 11.0, 10.0, 16.0, 16.0, 9.0, 24.0, 27.0, 29.0, 27.0, 30.0, 30.0, 33.0, 39.0, 35.0, 30.0, 42.0, 54.0, 33.0, 47.0, 40.0, 50.0, 46.0, 28.0, 26.0, 36.0, 34.0, 33.0, 27.0, 14.0, 16.0, 15.0, 10.0, 15.0, 8.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-160.94764709472656, -155.8898468017578, -150.83206176757812, -145.77426147460938, -140.7164764404297, -135.65867614746094, -130.60089111328125, -125.5430908203125, -120.48529815673828, -115.42750549316406, -110.36971282958984, -105.31192016601562, -100.25411987304688, -95.19633483886719, -90.13853454589844, -85.08074188232422, -80.02294921875, -74.96515655517578, -69.90736389160156, -64.84957122802734, -59.79177474975586, -54.73398208618164, -49.676185607910156, -44.61839294433594, -39.56060028076172, -34.5028076171875, -29.44501304626465, -24.387218475341797, -19.329425811767578, -14.27163314819336, -9.213838577270508, -4.156044006347656, 0.9017486572265625, 5.959542274475098, 11.017335891723633, 16.075130462646484, 21.132923126220703, 26.190715789794922, 31.248510360717773, 36.306304931640625, 41.364097595214844, 46.42189025878906, 51.47968292236328, 56.537479400634766, 61.595272064208984, 66.65306091308594, 71.71086120605469, 76.7686538696289, 81.82644653320312, 86.88423919677734, 91.94203186035156, 96.99982452392578, 102.0576171875, 107.11541748046875, 112.17321014404297, 117.23100280761719, 122.2887954711914, 127.34658813476562, 132.40438842773438, 137.46217346191406, 142.5199737548828, 147.5777587890625, 152.63555908203125, 157.693359375, 162.7511444091797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 10.0, 7.0, 17.0, 26.0, 36.0, 34.0, 77.0, 112.0, 160.0, 244.0, 407.0, 715.0, 1535.0, 3271.0, 7469.0, 19346.0, 61789.0, 353539.0, 3523583.0, 158653.0, 38272.0, 13807.0, 5669.0, 2631.0, 1298.0, 710.0, 356.0, 201.0, 109.0, 55.0, 54.0, 27.0, 16.0, 8.0, 9.0, 9.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-64.6875, -63.0419921875, -61.396484375, -59.7509765625, -58.10546875, -56.4599609375, -54.814453125, -53.1689453125, -51.5234375, -49.8779296875, -48.232421875, -46.5869140625, -44.94140625, -43.2958984375, -41.650390625, -40.0048828125, -38.359375, -36.7138671875, -35.068359375, -33.4228515625, -31.77734375, -30.1318359375, -28.486328125, -26.8408203125, -25.1953125, -23.5498046875, -21.904296875, -20.2587890625, -18.61328125, -16.9677734375, -15.322265625, -13.6767578125, -12.03125, -10.3857421875, -8.740234375, -7.0947265625, -5.44921875, -3.8037109375, -2.158203125, -0.5126953125, 1.1328125, 2.7783203125, 4.423828125, 6.0693359375, 7.71484375, 9.3603515625, 11.005859375, 12.6513671875, 14.296875, 15.9423828125, 17.587890625, 19.2333984375, 20.87890625, 22.5244140625, 24.169921875, 25.8154296875, 27.4609375, 29.1064453125, 30.751953125, 32.3974609375, 34.04296875, 35.6884765625, 37.333984375, 38.9794921875, 40.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 16.0, 14.0, 21.0, 22.0, 32.0, 36.0, 39.0, 53.0, 46.0, 64.0, 54.0, 72.0, 61.0, 64.0, 60.0, 51.0, 43.0, 41.0, 41.0, 33.0, 26.0, 12.0, 25.0, 13.0, 11.0, 12.0, 3.0, 5.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.12109375, -5.9432373046875, -5.765380859375, -5.5875244140625, -5.40966796875, -5.2318115234375, -5.053955078125, -4.8760986328125, -4.6982421875, -4.5203857421875, -4.342529296875, -4.1646728515625, -3.98681640625, -3.8089599609375, -3.631103515625, -3.4532470703125, -3.275390625, -3.0975341796875, -2.919677734375, -2.7418212890625, -2.56396484375, -2.3861083984375, -2.208251953125, -2.0303955078125, -1.8525390625, -1.6746826171875, -1.496826171875, -1.3189697265625, -1.14111328125, -0.9632568359375, -0.785400390625, -0.6075439453125, -0.4296875, -0.2518310546875, -0.073974609375, 0.1038818359375, 0.28173828125, 0.4595947265625, 0.637451171875, 0.8153076171875, 0.9931640625, 1.1710205078125, 1.348876953125, 1.5267333984375, 1.70458984375, 1.8824462890625, 2.060302734375, 2.2381591796875, 2.416015625, 2.5938720703125, 2.771728515625, 2.9495849609375, 3.12744140625, 3.3052978515625, 3.483154296875, 3.6610107421875, 3.8388671875, 4.0167236328125, 4.194580078125, 4.3724365234375, 4.55029296875, 4.7281494140625, 4.906005859375, 5.0838623046875, 5.26171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 13.0, 19.0, 33.0, 34.0, 57.0, 110.0, 158.0, 275.0, 473.0, 825.0, 1521.0, 2989.0, 6576.0, 16666.0, 52132.0, 256378.0, 3425931.0, 337176.0, 60423.0, 18441.0, 7202.0, 3157.0, 1575.0, 826.0, 487.0, 274.0, 183.0, 115.0, 84.0, 50.0, 31.0, 24.0, 14.0, 12.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.59375, -61.8056640625, -60.017578125, -58.2294921875, -56.44140625, -54.6533203125, -52.865234375, -51.0771484375, -49.2890625, -47.5009765625, -45.712890625, -43.9248046875, -42.13671875, -40.3486328125, -38.560546875, -36.7724609375, -34.984375, -33.1962890625, -31.408203125, -29.6201171875, -27.83203125, -26.0439453125, -24.255859375, -22.4677734375, -20.6796875, -18.8916015625, -17.103515625, -15.3154296875, -13.52734375, -11.7392578125, -9.951171875, -8.1630859375, -6.375, -4.5869140625, -2.798828125, -1.0107421875, 0.77734375, 2.5654296875, 4.353515625, 6.1416015625, 7.9296875, 9.7177734375, 11.505859375, 13.2939453125, 15.08203125, 16.8701171875, 18.658203125, 20.4462890625, 22.234375, 24.0224609375, 25.810546875, 27.5986328125, 29.38671875, 31.1748046875, 32.962890625, 34.7509765625, 36.5390625, 38.3271484375, 40.115234375, 41.9033203125, 43.69140625, 45.4794921875, 47.267578125, 49.0556640625, 50.84375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 4.0, 18.0, 13.0, 19.0, 35.0, 36.0, 62.0, 65.0, 96.0, 156.0, 262.0, 537.0, 1779.0, 363.0, 180.0, 128.0, 64.0, 59.0, 40.0, 33.0, 29.0, 17.0, 14.0, 8.0, 2.0, 6.0, 3.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.8203125, -12.4102783203125, -12.000244140625, -11.5902099609375, -11.18017578125, -10.7701416015625, -10.360107421875, -9.9500732421875, -9.5400390625, -9.1300048828125, -8.719970703125, -8.3099365234375, -7.89990234375, -7.4898681640625, -7.079833984375, -6.6697998046875, -6.259765625, -5.8497314453125, -5.439697265625, -5.0296630859375, -4.61962890625, -4.2095947265625, -3.799560546875, -3.3895263671875, -2.9794921875, -2.5694580078125, -2.159423828125, -1.7493896484375, -1.33935546875, -0.9293212890625, -0.519287109375, -0.1092529296875, 0.30078125, 0.7108154296875, 1.120849609375, 1.5308837890625, 1.94091796875, 2.3509521484375, 2.760986328125, 3.1710205078125, 3.5810546875, 3.9910888671875, 4.401123046875, 4.8111572265625, 5.22119140625, 5.6312255859375, 6.041259765625, 6.4512939453125, 6.861328125, 7.2713623046875, 7.681396484375, 8.0914306640625, 8.50146484375, 8.9114990234375, 9.321533203125, 9.7315673828125, 10.1416015625, 10.5516357421875, 10.961669921875, 11.3717041015625, 11.78173828125, 12.1917724609375, 12.601806640625, 13.0118408203125, 13.421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 18.0, 17.0, 22.0, 41.0, 62.0, 74.0, 156.0, 152.0, 127.0, 106.0, 78.0, 56.0, 29.0, 18.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-81.20330047607422, -78.2730712890625, -75.34284973144531, -72.41262817382812, -69.4823989868164, -66.55216979980469, -63.6219482421875, -60.69172286987305, -57.761497497558594, -54.83127212524414, -51.90104675292969, -48.970821380615234, -46.04059600830078, -43.11037063598633, -40.180145263671875, -37.24991989135742, -34.31969451904297, -31.389469146728516, -28.459243774414062, -25.52901840209961, -22.598793029785156, -19.668567657470703, -16.73834228515625, -13.808116912841797, -10.877891540527344, -7.947666168212891, -5.0174407958984375, -2.0872154235839844, 0.8430099487304688, 3.773235321044922, 6.703460693359375, 9.633686065673828, 12.563919067382812, 15.494144439697266, 18.42436981201172, 21.354595184326172, 24.284820556640625, 27.215045928955078, 30.14527130126953, 33.075496673583984, 36.00572204589844, 38.93594741821289, 41.866172790527344, 44.7963981628418, 47.72662353515625, 50.6568489074707, 53.587074279785156, 56.51729965209961, 59.44752502441406, 62.377750396728516, 65.30797576904297, 68.23820495605469, 71.16842651367188, 74.09864807128906, 77.02887725830078, 79.9591064453125, 82.88932800292969, 85.81954956054688, 88.7497787475586, 91.68000793457031, 94.6102294921875, 97.54045104980469, 100.4706802368164, 103.40090942382812, 106.33113098144531]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 13.0, 8.0, 25.0, 24.0, 15.0, 36.0, 29.0, 40.0, 36.0, 46.0, 40.0, 39.0, 61.0, 41.0, 52.0, 44.0, 43.0, 38.0, 28.0, 41.0, 36.0, 35.0, 32.0, 29.0, 27.0, 17.0, 16.0, 13.0, 11.0, 7.0, 6.0, 12.0, 6.0, 10.0, 10.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.28271484375, -46.7509880065918, -45.21925735473633, -43.687530517578125, -42.15580368041992, -40.62407684326172, -39.09234619140625, -37.56061935424805, -36.028892517089844, -34.49716567993164, -32.96543502807617, -31.43370819091797, -29.901981353759766, -28.37025260925293, -26.838523864746094, -25.30679702758789, -23.775066375732422, -22.243337631225586, -20.711610794067383, -19.179882049560547, -17.648155212402344, -16.116426467895508, -14.584697723388672, -13.052969932556152, -11.521242141723633, -9.989514350891113, -8.457786560058594, -6.926057815551758, -5.394330024719238, -3.8626022338867188, -2.330873489379883, -0.7991456985473633, 0.7325820922851562, 2.264310121536255, 3.7960381507873535, 5.327766418457031, 6.859494209289551, 8.39122200012207, 9.922950744628906, 11.454678535461426, 12.986406326293945, 14.518134117126465, 16.049861907958984, 17.58159065246582, 19.113319396972656, 20.64504623413086, 22.176774978637695, 23.70850372314453, 25.240230560302734, 26.77195930480957, 28.303686141967773, 29.83541488647461, 31.367141723632812, 32.89887237548828, 34.430599212646484, 35.96232604980469, 37.494056701660156, 39.02578353881836, 40.55751419067383, 42.08924102783203, 43.620967864990234, 45.15269470214844, 46.684425354003906, 48.21615219116211, 49.74787902832031]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 11.0, 18.0, 14.0, 31.0, 26.0, 68.0, 72.0, 131.0, 186.0, 287.0, 396.0, 638.0, 1040.0, 1880.0, 3269.0, 5772.0, 11059.0, 22474.0, 46201.0, 98852.0, 211631.0, 311793.0, 173689.0, 81114.0, 38038.0, 18613.0, 9357.0, 4999.0, 2746.0, 1683.0, 955.0, 573.0, 302.0, 220.0, 123.0, 111.0, 62.0, 38.0, 17.0, 18.0, 10.0, 8.0, 8.0, 5.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-25.921875, -25.14501953125, -24.3681640625, -23.59130859375, -22.814453125, -22.03759765625, -21.2607421875, -20.48388671875, -19.70703125, -18.93017578125, -18.1533203125, -17.37646484375, -16.599609375, -15.82275390625, -15.0458984375, -14.26904296875, -13.4921875, -12.71533203125, -11.9384765625, -11.16162109375, -10.384765625, -9.60791015625, -8.8310546875, -8.05419921875, -7.27734375, -6.50048828125, -5.7236328125, -4.94677734375, -4.169921875, -3.39306640625, -2.6162109375, -1.83935546875, -1.0625, -0.28564453125, 0.4912109375, 1.26806640625, 2.044921875, 2.82177734375, 3.5986328125, 4.37548828125, 5.15234375, 5.92919921875, 6.7060546875, 7.48291015625, 8.259765625, 9.03662109375, 9.8134765625, 10.59033203125, 11.3671875, 12.14404296875, 12.9208984375, 13.69775390625, 14.474609375, 15.25146484375, 16.0283203125, 16.80517578125, 17.58203125, 18.35888671875, 19.1357421875, 19.91259765625, 20.689453125, 21.46630859375, 22.2431640625, 23.02001953125, 23.796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 12.0, 18.0, 30.0, 25.0, 29.0, 26.0, 43.0, 43.0, 45.0, 62.0, 67.0, 60.0, 65.0, 55.0, 42.0, 53.0, 48.0, 50.0, 46.0, 25.0, 29.0, 22.0, 18.0, 15.0, 10.0, 5.0, 5.0, 13.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75, -5.56817626953125, -5.3863525390625, -5.20452880859375, -5.022705078125, -4.84088134765625, -4.6590576171875, -4.47723388671875, -4.29541015625, -4.11358642578125, -3.9317626953125, -3.74993896484375, -3.568115234375, -3.38629150390625, -3.2044677734375, -3.02264404296875, -2.8408203125, -2.65899658203125, -2.4771728515625, -2.29534912109375, -2.113525390625, -1.93170166015625, -1.7498779296875, -1.56805419921875, -1.38623046875, -1.20440673828125, -1.0225830078125, -0.84075927734375, -0.658935546875, -0.47711181640625, -0.2952880859375, -0.11346435546875, 0.068359375, 0.25018310546875, 0.4320068359375, 0.61383056640625, 0.795654296875, 0.97747802734375, 1.1593017578125, 1.34112548828125, 1.52294921875, 1.70477294921875, 1.8865966796875, 2.06842041015625, 2.250244140625, 2.43206787109375, 2.6138916015625, 2.79571533203125, 2.9775390625, 3.15936279296875, 3.3411865234375, 3.52301025390625, 3.704833984375, 3.88665771484375, 4.0684814453125, 4.25030517578125, 4.43212890625, 4.61395263671875, 4.7957763671875, 4.97760009765625, 5.159423828125, 5.34124755859375, 5.5230712890625, 5.70489501953125, 5.88671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 21.0, 20.0, 23.0, 34.0, 66.0, 116.0, 159.0, 280.0, 468.0, 914.0, 1515.0, 3059.0, 6371.0, 14825.0, 36784.0, 104342.0, 317935.0, 365965.0, 121827.0, 42519.0, 16689.0, 7309.0, 3364.0, 1673.0, 872.0, 524.0, 312.0, 176.0, 128.0, 92.0, 47.0, 31.0, 23.0, 15.0, 13.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.6875, -37.614990234375, -36.54248046875, -35.469970703125, -34.3974609375, -33.324951171875, -32.25244140625, -31.179931640625, -30.107421875, -29.034912109375, -27.96240234375, -26.889892578125, -25.8173828125, -24.744873046875, -23.67236328125, -22.599853515625, -21.52734375, -20.454833984375, -19.38232421875, -18.309814453125, -17.2373046875, -16.164794921875, -15.09228515625, -14.019775390625, -12.947265625, -11.874755859375, -10.80224609375, -9.729736328125, -8.6572265625, -7.584716796875, -6.51220703125, -5.439697265625, -4.3671875, -3.294677734375, -2.22216796875, -1.149658203125, -0.0771484375, 0.995361328125, 2.06787109375, 3.140380859375, 4.212890625, 5.285400390625, 6.35791015625, 7.430419921875, 8.5029296875, 9.575439453125, 10.64794921875, 11.720458984375, 12.79296875, 13.865478515625, 14.93798828125, 16.010498046875, 17.0830078125, 18.155517578125, 19.22802734375, 20.300537109375, 21.373046875, 22.445556640625, 23.51806640625, 24.590576171875, 25.6630859375, 26.735595703125, 27.80810546875, 28.880615234375, 29.953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 5.0, 12.0, 2.0, 3.0, 16.0, 23.0, 21.0, 21.0, 31.0, 42.0, 45.0, 38.0, 65.0, 54.0, 65.0, 57.0, 40.0, 54.0, 51.0, 49.0, 52.0, 40.0, 26.0, 33.0, 22.0, 24.0, 18.0, 13.0, 18.0, 12.0, 9.0, 6.0, 4.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.21875, -32.24267578125, -31.2666015625, -30.29052734375, -29.314453125, -28.33837890625, -27.3623046875, -26.38623046875, -25.41015625, -24.43408203125, -23.4580078125, -22.48193359375, -21.505859375, -20.52978515625, -19.5537109375, -18.57763671875, -17.6015625, -16.62548828125, -15.6494140625, -14.67333984375, -13.697265625, -12.72119140625, -11.7451171875, -10.76904296875, -9.79296875, -8.81689453125, -7.8408203125, -6.86474609375, -5.888671875, -4.91259765625, -3.9365234375, -2.96044921875, -1.984375, -1.00830078125, -0.0322265625, 0.94384765625, 1.919921875, 2.89599609375, 3.8720703125, 4.84814453125, 5.82421875, 6.80029296875, 7.7763671875, 8.75244140625, 9.728515625, 10.70458984375, 11.6806640625, 12.65673828125, 13.6328125, 14.60888671875, 15.5849609375, 16.56103515625, 17.537109375, 18.51318359375, 19.4892578125, 20.46533203125, 21.44140625, 22.41748046875, 23.3935546875, 24.36962890625, 25.345703125, 26.32177734375, 27.2978515625, 28.27392578125, 29.25]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 16.0, 13.0, 13.0, 22.0, 28.0, 46.0, 59.0, 90.0, 138.0, 198.0, 250.0, 486.0, 873.0, 1454.0, 2792.0, 5890.0, 14037.0, 39795.0, 139089.0, 444961.0, 282633.0, 74082.0, 23604.0, 9098.0, 4021.0, 2019.0, 1082.0, 623.0, 349.0, 230.0, 158.0, 98.0, 96.0, 55.0, 43.0, 32.0, 21.0, 18.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0], "bins": [-16.828125, -16.314453125, -15.80078125, -15.287109375, -14.7734375, -14.259765625, -13.74609375, -13.232421875, -12.71875, -12.205078125, -11.69140625, -11.177734375, -10.6640625, -10.150390625, -9.63671875, -9.123046875, -8.609375, -8.095703125, -7.58203125, -7.068359375, -6.5546875, -6.041015625, -5.52734375, -5.013671875, -4.5, -3.986328125, -3.47265625, -2.958984375, -2.4453125, -1.931640625, -1.41796875, -0.904296875, -0.390625, 0.123046875, 0.63671875, 1.150390625, 1.6640625, 2.177734375, 2.69140625, 3.205078125, 3.71875, 4.232421875, 4.74609375, 5.259765625, 5.7734375, 6.287109375, 6.80078125, 7.314453125, 7.828125, 8.341796875, 8.85546875, 9.369140625, 9.8828125, 10.396484375, 10.91015625, 11.423828125, 11.9375, 12.451171875, 12.96484375, 13.478515625, 13.9921875, 14.505859375, 15.01953125, 15.533203125, 16.046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 0.0, 5.0, 6.0, 7.0, 7.0, 6.0, 19.0, 13.0, 21.0, 33.0, 39.0, 67.0, 111.0, 111.0, 125.0, 104.0, 98.0, 66.0, 42.0, 34.0, 20.0, 18.0, 10.0, 9.0, 6.0, 4.0, 1.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030345916748046875, -0.002905339002609253, -0.0027760863304138184, -0.002646833658218384, -0.0025175809860229492, -0.0023883283138275146, -0.00225907564163208, -0.0021298229694366455, -0.002000570297241211, -0.0018713176250457764, -0.0017420649528503418, -0.0016128122806549072, -0.0014835596084594727, -0.001354306936264038, -0.0012250542640686035, -0.001095801591873169, -0.0009665489196777344, -0.0008372962474822998, -0.0007080435752868652, -0.0005787909030914307, -0.0004495382308959961, -0.0003202855587005615, -0.00019103288650512695, -6.178021430969238e-05, 6.747245788574219e-05, 0.00019672513008117676, 0.00032597780227661133, 0.0004552304744720459, 0.0005844831466674805, 0.000713735818862915, 0.0008429884910583496, 0.0009722411632537842, 0.0011014938354492188, 0.0012307465076446533, 0.0013599991798400879, 0.0014892518520355225, 0.001618504524230957, 0.0017477571964263916, 0.0018770098686218262, 0.0020062625408172607, 0.0021355152130126953, 0.00226476788520813, 0.0023940205574035645, 0.002523273229598999, 0.0026525259017944336, 0.002781778573989868, 0.0029110312461853027, 0.0030402839183807373, 0.003169536590576172, 0.0032987892627716064, 0.003428041934967041, 0.0035572946071624756, 0.00368654727935791, 0.0038157999515533447, 0.003945052623748779, 0.004074305295944214, 0.0042035579681396484, 0.004332810640335083, 0.004462063312530518, 0.004591315984725952, 0.004720568656921387, 0.004849821329116821, 0.004979074001312256, 0.00510832667350769, 0.005237579345703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 3.0, 11.0, 13.0, 15.0, 18.0, 32.0, 29.0, 41.0, 63.0, 97.0, 148.0, 219.0, 304.0, 566.0, 895.0, 1642.0, 3455.0, 8130.0, 24018.0, 96368.0, 453432.0, 353777.0, 72707.0, 19234.0, 6634.0, 2914.0, 1514.0, 822.0, 513.0, 280.0, 212.0, 115.0, 94.0, 62.0, 56.0, 39.0, 15.0, 12.0, 10.0, 16.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.24951171875, -16.6083984375, -15.96728515625, -15.326171875, -14.68505859375, -14.0439453125, -13.40283203125, -12.76171875, -12.12060546875, -11.4794921875, -10.83837890625, -10.197265625, -9.55615234375, -8.9150390625, -8.27392578125, -7.6328125, -6.99169921875, -6.3505859375, -5.70947265625, -5.068359375, -4.42724609375, -3.7861328125, -3.14501953125, -2.50390625, -1.86279296875, -1.2216796875, -0.58056640625, 0.060546875, 0.70166015625, 1.3427734375, 1.98388671875, 2.625, 3.26611328125, 3.9072265625, 4.54833984375, 5.189453125, 5.83056640625, 6.4716796875, 7.11279296875, 7.75390625, 8.39501953125, 9.0361328125, 9.67724609375, 10.318359375, 10.95947265625, 11.6005859375, 12.24169921875, 12.8828125, 13.52392578125, 14.1650390625, 14.80615234375, 15.447265625, 16.08837890625, 16.7294921875, 17.37060546875, 18.01171875, 18.65283203125, 19.2939453125, 19.93505859375, 20.576171875, 21.21728515625, 21.8583984375, 22.49951171875, 23.140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 4.0, 15.0, 29.0, 36.0, 42.0, 63.0, 101.0, 119.0, 128.0, 113.0, 107.0, 85.0, 45.0, 29.0, 21.0, 17.0, 13.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.90087890625, -15.2548828125, -14.60888671875, -13.962890625, -13.31689453125, -12.6708984375, -12.02490234375, -11.37890625, -10.73291015625, -10.0869140625, -9.44091796875, -8.794921875, -8.14892578125, -7.5029296875, -6.85693359375, -6.2109375, -5.56494140625, -4.9189453125, -4.27294921875, -3.626953125, -2.98095703125, -2.3349609375, -1.68896484375, -1.04296875, -0.39697265625, 0.2490234375, 0.89501953125, 1.541015625, 2.18701171875, 2.8330078125, 3.47900390625, 4.125, 4.77099609375, 5.4169921875, 6.06298828125, 6.708984375, 7.35498046875, 8.0009765625, 8.64697265625, 9.29296875, 9.93896484375, 10.5849609375, 11.23095703125, 11.876953125, 12.52294921875, 13.1689453125, 13.81494140625, 14.4609375, 15.10693359375, 15.7529296875, 16.39892578125, 17.044921875, 17.69091796875, 18.3369140625, 18.98291015625, 19.62890625, 20.27490234375, 20.9208984375, 21.56689453125, 22.212890625, 22.85888671875, 23.5048828125, 24.15087890625, 24.796875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 26.0, 49.0, 125.0, 311.0, 293.0, 134.0, 40.0, 21.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-432.3655700683594, -411.714111328125, -391.0626220703125, -370.4111328125, -349.7596740722656, -329.10821533203125, -308.45672607421875, -287.80523681640625, -267.1537780761719, -246.50230407714844, -225.850830078125, -205.19935607910156, -184.54788208007812, -163.8964080810547, -143.24493408203125, -122.59346008300781, -101.94198608398438, -81.29051208496094, -60.6390380859375, -39.98756408691406, -19.336090087890625, 1.3153839111328125, 21.96685791015625, 42.61833190917969, 63.269805908203125, 83.92127990722656, 104.57275390625, 125.22422790527344, 145.87570190429688, 166.5271759033203, 187.17864990234375, 207.8301239013672, 228.4815673828125, 249.13304138183594, 269.7845153808594, 290.43597412109375, 311.08746337890625, 331.73895263671875, 352.3904113769531, 373.0418701171875, 393.693359375, 414.3448486328125, 434.9963073730469, 455.64776611328125, 476.29925537109375, 496.95074462890625, 517.6021728515625, 538.253662109375, 558.9051513671875, 579.556640625, 600.2081298828125, 620.8595581054688, 641.5110473632812, 662.1625366210938, 682.81396484375, 703.4654541015625, 724.116943359375, 744.7684326171875, 765.419921875, 786.0713500976562, 806.7228393554688, 827.3743286132812, 848.0257568359375, 868.67724609375, 889.3287353515625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 3.0, 1.0, 7.0, 14.0, 8.0, 10.0, 18.0, 22.0, 38.0, 44.0, 43.0, 45.0, 51.0, 58.0, 72.0, 66.0, 69.0, 49.0, 64.0, 40.0, 54.0, 36.0, 40.0, 33.0, 18.0, 25.0, 19.0, 16.0, 12.0, 9.0, 4.0, 11.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.98704528808594, -127.05823516845703, -120.12942504882812, -113.20062255859375, -106.27181243896484, -99.34300231933594, -92.41419982910156, -85.48538970947266, -78.55657958984375, -71.62776947021484, -64.69895935058594, -57.77015686035156, -50.841346740722656, -43.91253662109375, -36.98373031616211, -30.05492401123047, -23.126113891601562, -16.19730567932129, -9.268497467041016, -2.339689254760742, 4.589118957519531, 11.517929077148438, 18.446735382080078, 25.37554168701172, 32.304351806640625, 39.23316192626953, 46.16196823120117, 53.09077453613281, 60.01958465576172, 66.94839477539062, 73.877197265625, 80.8060073852539, 87.73483276367188, 94.66364288330078, 101.59245300292969, 108.52125549316406, 115.45006561279297, 122.37887573242188, 129.30767822265625, 136.23648071289062, 143.16529846191406, 150.09410095214844, 157.02291870117188, 163.95172119140625, 170.88052368164062, 177.80934143066406, 184.73814392089844, 191.66696166992188, 198.59576416015625, 205.52456665039062, 212.45338439941406, 219.38218688964844, 226.31100463867188, 233.23980712890625, 240.16860961914062, 247.097412109375, 254.02622985839844, 260.9550476074219, 267.88385009765625, 274.8126525878906, 281.741455078125, 288.6702880859375, 295.5990905761719, 302.52789306640625, 309.4566955566406]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 13.0, 9.0, 8.0, 16.0, 30.0, 56.0, 39.0, 48.0, 99.0, 153.0, 229.0, 360.0, 586.0, 962.0, 1797.0, 3294.0, 6100.0, 12796.0, 29957.0, 94175.0, 2820837.0, 1077015.0, 89594.0, 29348.0, 12570.0, 6040.0, 3262.0, 1889.0, 1058.0, 637.0, 420.0, 289.0, 168.0, 128.0, 90.0, 56.0, 44.0, 24.0, 20.0, 18.0, 13.0, 7.0, 4.0, 9.0, 2.0, 4.0], "bins": [-46.53125, -45.337646484375, -44.14404296875, -42.950439453125, -41.7568359375, -40.563232421875, -39.36962890625, -38.176025390625, -36.982421875, -35.788818359375, -34.59521484375, -33.401611328125, -32.2080078125, -31.014404296875, -29.82080078125, -28.627197265625, -27.43359375, -26.239990234375, -25.04638671875, -23.852783203125, -22.6591796875, -21.465576171875, -20.27197265625, -19.078369140625, -17.884765625, -16.691162109375, -15.49755859375, -14.303955078125, -13.1103515625, -11.916748046875, -10.72314453125, -9.529541015625, -8.3359375, -7.142333984375, -5.94873046875, -4.755126953125, -3.5615234375, -2.367919921875, -1.17431640625, 0.019287109375, 1.212890625, 2.406494140625, 3.60009765625, 4.793701171875, 5.9873046875, 7.180908203125, 8.37451171875, 9.568115234375, 10.76171875, 11.955322265625, 13.14892578125, 14.342529296875, 15.5361328125, 16.729736328125, 17.92333984375, 19.116943359375, 20.310546875, 21.504150390625, 22.69775390625, 23.891357421875, 25.0849609375, 26.278564453125, 27.47216796875, 28.665771484375, 29.859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 11.0, 11.0, 25.0, 28.0, 30.0, 54.0, 46.0, 61.0, 62.0, 82.0, 82.0, 86.0, 69.0, 63.0, 65.0, 50.0, 50.0, 33.0, 25.0, 19.0, 11.0, 7.0, 10.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.678955078125, -6.41259765625, -6.146240234375, -5.8798828125, -5.613525390625, -5.34716796875, -5.080810546875, -4.814453125, -4.548095703125, -4.28173828125, -4.015380859375, -3.7490234375, -3.482666015625, -3.21630859375, -2.949951171875, -2.68359375, -2.417236328125, -2.15087890625, -1.884521484375, -1.6181640625, -1.351806640625, -1.08544921875, -0.819091796875, -0.552734375, -0.286376953125, -0.02001953125, 0.246337890625, 0.5126953125, 0.779052734375, 1.04541015625, 1.311767578125, 1.578125, 1.844482421875, 2.11083984375, 2.377197265625, 2.6435546875, 2.909912109375, 3.17626953125, 3.442626953125, 3.708984375, 3.975341796875, 4.24169921875, 4.508056640625, 4.7744140625, 5.040771484375, 5.30712890625, 5.573486328125, 5.83984375, 6.106201171875, 6.37255859375, 6.638916015625, 6.9052734375, 7.171630859375, 7.43798828125, 7.704345703125, 7.970703125, 8.237060546875, 8.50341796875, 8.769775390625, 9.0361328125, 9.302490234375, 9.56884765625, 9.835205078125, 10.1015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 4.0, 12.0, 13.0, 7.0, 15.0, 36.0, 46.0, 60.0, 102.0, 142.0, 217.0, 386.0, 625.0, 1217.0, 2132.0, 4372.0, 9660.0, 22993.0, 67920.0, 319793.0, 3439845.0, 233334.0, 55379.0, 19674.0, 8271.0, 3716.0, 1841.0, 1009.0, 509.0, 306.0, 202.0, 141.0, 90.0, 55.0, 47.0, 34.0, 25.0, 19.0, 12.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.96875, -45.52001953125, -44.0712890625, -42.62255859375, -41.173828125, -39.72509765625, -38.2763671875, -36.82763671875, -35.37890625, -33.93017578125, -32.4814453125, -31.03271484375, -29.583984375, -28.13525390625, -26.6865234375, -25.23779296875, -23.7890625, -22.34033203125, -20.8916015625, -19.44287109375, -17.994140625, -16.54541015625, -15.0966796875, -13.64794921875, -12.19921875, -10.75048828125, -9.3017578125, -7.85302734375, -6.404296875, -4.95556640625, -3.5068359375, -2.05810546875, -0.609375, 0.83935546875, 2.2880859375, 3.73681640625, 5.185546875, 6.63427734375, 8.0830078125, 9.53173828125, 10.98046875, 12.42919921875, 13.8779296875, 15.32666015625, 16.775390625, 18.22412109375, 19.6728515625, 21.12158203125, 22.5703125, 24.01904296875, 25.4677734375, 26.91650390625, 28.365234375, 29.81396484375, 31.2626953125, 32.71142578125, 34.16015625, 35.60888671875, 37.0576171875, 38.50634765625, 39.955078125, 41.40380859375, 42.8525390625, 44.30126953125, 45.75]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 4.0, 3.0, 5.0, 10.0, 12.0, 13.0, 16.0, 21.0, 33.0, 49.0, 76.0, 98.0, 168.0, 343.0, 2202.0, 470.0, 194.0, 106.0, 71.0, 54.0, 35.0, 23.0, 20.0, 12.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4375, -14.94921875, -14.4609375, -13.97265625, -13.484375, -12.99609375, -12.5078125, -12.01953125, -11.53125, -11.04296875, -10.5546875, -10.06640625, -9.578125, -9.08984375, -8.6015625, -8.11328125, -7.625, -7.13671875, -6.6484375, -6.16015625, -5.671875, -5.18359375, -4.6953125, -4.20703125, -3.71875, -3.23046875, -2.7421875, -2.25390625, -1.765625, -1.27734375, -0.7890625, -0.30078125, 0.1875, 0.67578125, 1.1640625, 1.65234375, 2.140625, 2.62890625, 3.1171875, 3.60546875, 4.09375, 4.58203125, 5.0703125, 5.55859375, 6.046875, 6.53515625, 7.0234375, 7.51171875, 8.0, 8.48828125, 8.9765625, 9.46484375, 9.953125, 10.44140625, 10.9296875, 11.41796875, 11.90625, 12.39453125, 12.8828125, 13.37109375, 13.859375, 14.34765625, 14.8359375, 15.32421875, 15.8125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 17.0, 29.0, 52.0, 83.0, 105.0, 144.0, 154.0, 140.0, 94.0, 69.0, 45.0, 10.0, 20.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-96.26805114746094, -93.10364532470703, -89.9392318725586, -86.77482604980469, -83.61042022705078, -80.44601440429688, -77.28160095214844, -74.11719512939453, -70.95278930664062, -67.78838348388672, -64.62397003173828, -61.459564208984375, -58.29515838623047, -55.1307487487793, -51.966339111328125, -48.80193328857422, -45.63751983642578, -42.47311019897461, -39.3087043762207, -36.14429473876953, -32.979888916015625, -29.815479278564453, -26.65106964111328, -23.486661911010742, -20.322254180908203, -17.157846450805664, -13.993437767028809, -10.829029083251953, -7.664621353149414, -4.500213623046875, -1.3358039855957031, 1.828603744506836, 4.993019104003906, 8.157426834106445, 11.3218355178833, 14.486244201660156, 17.650651931762695, 20.815059661865234, 23.979469299316406, 27.143877029418945, 30.308284759521484, 33.472694396972656, 36.63710021972656, 39.801509857177734, 42.965919494628906, 46.13032531738281, 49.294734954833984, 52.459144592285156, 55.62355041503906, 58.787960052490234, 61.95236587524414, 65.11677551269531, 68.28118133544922, 71.44558715820312, 74.61000061035156, 77.77440643310547, 80.93881225585938, 84.10321807861328, 87.26763153076172, 90.43203735351562, 93.59644317626953, 96.76084899902344, 99.92526245117188, 103.08966827392578, 106.25408172607422]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 10.0, 6.0, 16.0, 10.0, 15.0, 19.0, 12.0, 28.0, 37.0, 30.0, 33.0, 44.0, 44.0, 52.0, 57.0, 63.0, 50.0, 65.0, 58.0, 43.0, 51.0, 50.0, 44.0, 32.0, 24.0, 35.0, 13.0, 20.0, 17.0, 9.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.17987060546875, -60.27134704589844, -58.36282730102539, -56.45430374145508, -54.545780181884766, -52.63726043701172, -50.728736877441406, -48.820213317871094, -46.91168975830078, -45.00316619873047, -43.09464645385742, -41.18612289428711, -39.2775993347168, -37.36907958984375, -35.46055603027344, -33.552032470703125, -31.643512725830078, -29.7349910736084, -27.826467514038086, -25.917945861816406, -24.009422302246094, -22.100900650024414, -20.192378997802734, -18.283855438232422, -16.375333786010742, -14.466811180114746, -12.55828857421875, -10.64976692199707, -8.741244316101074, -6.832721710205078, -4.924200057983398, -3.0156774520874023, -1.1071548461914062, 0.8013675212860107, 2.7098898887634277, 4.618412017822266, 6.526934623718262, 8.435457229614258, 10.343978881835938, 12.252501487731934, 14.16102409362793, 16.06954574584961, 17.978069305419922, 19.8865909576416, 21.79511260986328, 23.703636169433594, 25.612157821655273, 27.520679473876953, 29.429203033447266, 31.337724685668945, 33.246246337890625, 35.15476989746094, 37.06329345703125, 38.97181701660156, 40.88033676147461, 42.78886032104492, 44.69738006591797, 46.60590362548828, 48.51442337036133, 50.42294692993164, 52.33147048950195, 54.239990234375, 56.14851379394531, 58.057037353515625, 59.96556091308594]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 9.0, 8.0, 10.0, 24.0, 34.0, 35.0, 56.0, 86.0, 119.0, 207.0, 282.0, 462.0, 762.0, 1261.0, 2208.0, 3913.0, 7131.0, 13323.0, 26350.0, 54431.0, 113010.0, 240900.0, 295633.0, 147638.0, 69736.0, 33691.0, 16960.0, 8930.0, 4622.0, 2736.0, 1549.0, 922.0, 510.0, 365.0, 202.0, 165.0, 97.0, 51.0, 40.0, 34.0, 16.0, 9.0, 11.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.265625, -23.433837890625, -22.60205078125, -21.770263671875, -20.9384765625, -20.106689453125, -19.27490234375, -18.443115234375, -17.611328125, -16.779541015625, -15.94775390625, -15.115966796875, -14.2841796875, -13.452392578125, -12.62060546875, -11.788818359375, -10.95703125, -10.125244140625, -9.29345703125, -8.461669921875, -7.6298828125, -6.798095703125, -5.96630859375, -5.134521484375, -4.302734375, -3.470947265625, -2.63916015625, -1.807373046875, -0.9755859375, -0.143798828125, 0.68798828125, 1.519775390625, 2.3515625, 3.183349609375, 4.01513671875, 4.846923828125, 5.6787109375, 6.510498046875, 7.34228515625, 8.174072265625, 9.005859375, 9.837646484375, 10.66943359375, 11.501220703125, 12.3330078125, 13.164794921875, 13.99658203125, 14.828369140625, 15.66015625, 16.491943359375, 17.32373046875, 18.155517578125, 18.9873046875, 19.819091796875, 20.65087890625, 21.482666015625, 22.314453125, 23.146240234375, 23.97802734375, 24.809814453125, 25.6416015625, 26.473388671875, 27.30517578125, 28.136962890625, 28.96875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 8.0, 6.0, 17.0, 18.0, 16.0, 22.0, 35.0, 36.0, 34.0, 33.0, 42.0, 43.0, 52.0, 51.0, 46.0, 52.0, 50.0, 47.0, 51.0, 52.0, 45.0, 39.0, 34.0, 28.0, 29.0, 18.0, 19.0, 16.0, 9.0, 9.0, 12.0, 4.0, 5.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.48828125, -6.29949951171875, -6.1107177734375, -5.92193603515625, -5.733154296875, -5.54437255859375, -5.3555908203125, -5.16680908203125, -4.97802734375, -4.78924560546875, -4.6004638671875, -4.41168212890625, -4.222900390625, -4.03411865234375, -3.8453369140625, -3.65655517578125, -3.4677734375, -3.27899169921875, -3.0902099609375, -2.90142822265625, -2.712646484375, -2.52386474609375, -2.3350830078125, -2.14630126953125, -1.95751953125, -1.76873779296875, -1.5799560546875, -1.39117431640625, -1.202392578125, -1.01361083984375, -0.8248291015625, -0.63604736328125, -0.447265625, -0.25848388671875, -0.0697021484375, 0.11907958984375, 0.307861328125, 0.49664306640625, 0.6854248046875, 0.87420654296875, 1.06298828125, 1.25177001953125, 1.4405517578125, 1.62933349609375, 1.818115234375, 2.00689697265625, 2.1956787109375, 2.38446044921875, 2.5732421875, 2.76202392578125, 2.9508056640625, 3.13958740234375, 3.328369140625, 3.51715087890625, 3.7059326171875, 3.89471435546875, 4.08349609375, 4.27227783203125, 4.4610595703125, 4.64984130859375, 4.838623046875, 5.02740478515625, 5.2161865234375, 5.40496826171875, 5.59375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 2.0, 7.0, 12.0, 25.0, 18.0, 42.0, 53.0, 80.0, 99.0, 151.0, 278.0, 413.0, 659.0, 1155.0, 2141.0, 4237.0, 9061.0, 21225.0, 52775.0, 148034.0, 384038.0, 266972.0, 93917.0, 34946.0, 14701.0, 6347.0, 3151.0, 1620.0, 910.0, 524.0, 325.0, 219.0, 126.0, 92.0, 64.0, 49.0, 18.0, 22.0, 17.0, 14.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.09375, -30.145263671875, -29.19677734375, -28.248291015625, -27.2998046875, -26.351318359375, -25.40283203125, -24.454345703125, -23.505859375, -22.557373046875, -21.60888671875, -20.660400390625, -19.7119140625, -18.763427734375, -17.81494140625, -16.866455078125, -15.91796875, -14.969482421875, -14.02099609375, -13.072509765625, -12.1240234375, -11.175537109375, -10.22705078125, -9.278564453125, -8.330078125, -7.381591796875, -6.43310546875, -5.484619140625, -4.5361328125, -3.587646484375, -2.63916015625, -1.690673828125, -0.7421875, 0.206298828125, 1.15478515625, 2.103271484375, 3.0517578125, 4.000244140625, 4.94873046875, 5.897216796875, 6.845703125, 7.794189453125, 8.74267578125, 9.691162109375, 10.6396484375, 11.588134765625, 12.53662109375, 13.485107421875, 14.43359375, 15.382080078125, 16.33056640625, 17.279052734375, 18.2275390625, 19.176025390625, 20.12451171875, 21.072998046875, 22.021484375, 22.969970703125, 23.91845703125, 24.866943359375, 25.8154296875, 26.763916015625, 27.71240234375, 28.660888671875, 29.609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 6.0, 4.0, 3.0, 11.0, 10.0, 16.0, 8.0, 17.0, 31.0, 24.0, 25.0, 29.0, 26.0, 48.0, 38.0, 56.0, 51.0, 65.0, 49.0, 47.0, 64.0, 65.0, 38.0, 47.0, 36.0, 41.0, 33.0, 21.0, 23.0, 24.0, 20.0, 10.0, 3.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.375, -32.386474609375, -31.39794921875, -30.409423828125, -29.4208984375, -28.432373046875, -27.44384765625, -26.455322265625, -25.466796875, -24.478271484375, -23.48974609375, -22.501220703125, -21.5126953125, -20.524169921875, -19.53564453125, -18.547119140625, -17.55859375, -16.570068359375, -15.58154296875, -14.593017578125, -13.6044921875, -12.615966796875, -11.62744140625, -10.638916015625, -9.650390625, -8.661865234375, -7.67333984375, -6.684814453125, -5.6962890625, -4.707763671875, -3.71923828125, -2.730712890625, -1.7421875, -0.753662109375, 0.23486328125, 1.223388671875, 2.2119140625, 3.200439453125, 4.18896484375, 5.177490234375, 6.166015625, 7.154541015625, 8.14306640625, 9.131591796875, 10.1201171875, 11.108642578125, 12.09716796875, 13.085693359375, 14.07421875, 15.062744140625, 16.05126953125, 17.039794921875, 18.0283203125, 19.016845703125, 20.00537109375, 20.993896484375, 21.982421875, 22.970947265625, 23.95947265625, 24.947998046875, 25.9365234375, 26.925048828125, 27.91357421875, 28.902099609375, 29.890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 7.0, 26.0, 34.0, 52.0, 69.0, 104.0, 187.0, 354.0, 490.0, 888.0, 1655.0, 3198.0, 7489.0, 22159.0, 116825.0, 647692.0, 198656.0, 30890.0, 9331.0, 4007.0, 1897.0, 1025.0, 564.0, 336.0, 221.0, 136.0, 85.0, 55.0, 36.0, 22.0, 18.0, 8.0, 9.0, 8.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.203125, -26.39404296875, -25.5849609375, -24.77587890625, -23.966796875, -23.15771484375, -22.3486328125, -21.53955078125, -20.73046875, -19.92138671875, -19.1123046875, -18.30322265625, -17.494140625, -16.68505859375, -15.8759765625, -15.06689453125, -14.2578125, -13.44873046875, -12.6396484375, -11.83056640625, -11.021484375, -10.21240234375, -9.4033203125, -8.59423828125, -7.78515625, -6.97607421875, -6.1669921875, -5.35791015625, -4.548828125, -3.73974609375, -2.9306640625, -2.12158203125, -1.3125, -0.50341796875, 0.3056640625, 1.11474609375, 1.923828125, 2.73291015625, 3.5419921875, 4.35107421875, 5.16015625, 5.96923828125, 6.7783203125, 7.58740234375, 8.396484375, 9.20556640625, 10.0146484375, 10.82373046875, 11.6328125, 12.44189453125, 13.2509765625, 14.06005859375, 14.869140625, 15.67822265625, 16.4873046875, 17.29638671875, 18.10546875, 18.91455078125, 19.7236328125, 20.53271484375, 21.341796875, 22.15087890625, 22.9599609375, 23.76904296875, 24.578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 21.0, 39.0, 60.0, 140.0, 235.0, 204.0, 90.0, 61.0, 40.0, 18.0, 7.0, 12.0, 9.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007381439208984375, -0.00712507963180542, -0.006868720054626465, -0.00661236047744751, -0.006356000900268555, -0.0060996413230896, -0.0058432817459106445, -0.0055869221687316895, -0.005330562591552734, -0.005074203014373779, -0.004817843437194824, -0.004561483860015869, -0.004305124282836914, -0.004048764705657959, -0.003792405128479004, -0.003536045551300049, -0.0032796859741210938, -0.0030233263969421387, -0.0027669668197631836, -0.0025106072425842285, -0.0022542476654052734, -0.0019978880882263184, -0.0017415285110473633, -0.0014851689338684082, -0.0012288093566894531, -0.000972449779510498, -0.000716090202331543, -0.0004597306251525879, -0.0002033710479736328, 5.2988529205322266e-05, 0.00030934810638427734, 0.0005657076835632324, 0.0008220672607421875, 0.0010784268379211426, 0.0013347864151000977, 0.0015911459922790527, 0.0018475055694580078, 0.002103865146636963, 0.002360224723815918, 0.002616584300994873, 0.002872943878173828, 0.003129303455352783, 0.0033856630325317383, 0.0036420226097106934, 0.0038983821868896484, 0.0041547417640686035, 0.004411101341247559, 0.004667460918426514, 0.004923820495605469, 0.005180180072784424, 0.005436539649963379, 0.005692899227142334, 0.005949258804321289, 0.006205618381500244, 0.006461977958679199, 0.006718337535858154, 0.006974697113037109, 0.0072310566902160645, 0.0074874162673950195, 0.007743775844573975, 0.00800013542175293, 0.008256494998931885, 0.00851285457611084, 0.008769214153289795, 0.00902557373046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 11.0, 11.0, 16.0, 24.0, 23.0, 42.0, 68.0, 105.0, 154.0, 208.0, 345.0, 525.0, 919.0, 1603.0, 3137.0, 6666.0, 17359.0, 74089.0, 564272.0, 312702.0, 43067.0, 12141.0, 5102.0, 2544.0, 1271.0, 805.0, 445.0, 286.0, 193.0, 127.0, 91.0, 50.0, 44.0, 34.0, 17.0, 15.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.228759765625, -24.41064453125, -23.592529296875, -22.7744140625, -21.956298828125, -21.13818359375, -20.320068359375, -19.501953125, -18.683837890625, -17.86572265625, -17.047607421875, -16.2294921875, -15.411376953125, -14.59326171875, -13.775146484375, -12.95703125, -12.138916015625, -11.32080078125, -10.502685546875, -9.6845703125, -8.866455078125, -8.04833984375, -7.230224609375, -6.412109375, -5.593994140625, -4.77587890625, -3.957763671875, -3.1396484375, -2.321533203125, -1.50341796875, -0.685302734375, 0.1328125, 0.950927734375, 1.76904296875, 2.587158203125, 3.4052734375, 4.223388671875, 5.04150390625, 5.859619140625, 6.677734375, 7.495849609375, 8.31396484375, 9.132080078125, 9.9501953125, 10.768310546875, 11.58642578125, 12.404541015625, 13.22265625, 14.040771484375, 14.85888671875, 15.677001953125, 16.4951171875, 17.313232421875, 18.13134765625, 18.949462890625, 19.767578125, 20.585693359375, 21.40380859375, 22.221923828125, 23.0400390625, 23.858154296875, 24.67626953125, 25.494384765625, 26.3125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 2.0, 6.0, 6.0, 6.0, 17.0, 11.0, 39.0, 60.0, 60.0, 100.0, 131.0, 147.0, 126.0, 99.0, 53.0, 50.0, 23.0, 19.0, 10.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.96875, -24.279296875, -23.58984375, -22.900390625, -22.2109375, -21.521484375, -20.83203125, -20.142578125, -19.453125, -18.763671875, -18.07421875, -17.384765625, -16.6953125, -16.005859375, -15.31640625, -14.626953125, -13.9375, -13.248046875, -12.55859375, -11.869140625, -11.1796875, -10.490234375, -9.80078125, -9.111328125, -8.421875, -7.732421875, -7.04296875, -6.353515625, -5.6640625, -4.974609375, -4.28515625, -3.595703125, -2.90625, -2.216796875, -1.52734375, -0.837890625, -0.1484375, 0.541015625, 1.23046875, 1.919921875, 2.609375, 3.298828125, 3.98828125, 4.677734375, 5.3671875, 6.056640625, 6.74609375, 7.435546875, 8.125, 8.814453125, 9.50390625, 10.193359375, 10.8828125, 11.572265625, 12.26171875, 12.951171875, 13.640625, 14.330078125, 15.01953125, 15.708984375, 16.3984375, 17.087890625, 17.77734375, 18.466796875, 19.15625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 15.0, 24.0, 86.0, 172.0, 295.0, 228.0, 110.0, 35.0, 22.0, 10.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-733.7855224609375, -717.6943969726562, -701.603271484375, -685.5120849609375, -669.4209594726562, -653.329833984375, -637.2387084960938, -621.1475830078125, -605.056396484375, -588.9652709960938, -572.8741455078125, -556.782958984375, -540.6918334960938, -524.6007080078125, -508.50958251953125, -492.4184265136719, -476.3273010253906, -460.2361755371094, -444.14501953125, -428.05389404296875, -411.9627380371094, -395.8716125488281, -379.78045654296875, -363.6893310546875, -347.59820556640625, -331.507080078125, -315.4159240722656, -299.3247985839844, -283.233642578125, -267.14251708984375, -251.05137634277344, -234.96023559570312, -218.86907958984375, -202.77793884277344, -186.68679809570312, -170.59567260742188, -154.5045166015625, -138.41339111328125, -122.32225036621094, -106.23110961914062, -90.13996887207031, -74.048828125, -57.95769119262695, -41.866554260253906, -25.775413513183594, -9.684272766113281, 6.4068603515625, 22.498001098632812, 38.589141845703125, 54.68028259277344, 70.77142333984375, 86.86255645751953, 102.95369720458984, 119.04483795166016, 135.13597106933594, 151.22711181640625, 167.31825256347656, 183.40939331054688, 199.5005340576172, 215.5916748046875, 231.68280029296875, 247.77395629882812, 263.8650817871094, 279.95623779296875, 296.04736328125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 5.0, 16.0, 8.0, 18.0, 20.0, 28.0, 28.0, 19.0, 22.0, 29.0, 40.0, 46.0, 41.0, 43.0, 44.0, 34.0, 34.0, 37.0, 42.0, 45.0, 49.0, 35.0, 33.0, 27.0, 26.0, 30.0, 20.0, 24.0, 21.0, 15.0, 8.0, 15.0, 15.0, 11.0, 14.0, 7.0, 0.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-136.99783325195312, -132.920654296875, -128.84347534179688, -124.76631164550781, -120.68913269042969, -116.61195373535156, -112.53478240966797, -108.45761108398438, -104.38043212890625, -100.30325317382812, -96.22608184814453, -92.14891052246094, -88.07173156738281, -83.99455261230469, -79.9173812866211, -75.8402099609375, -71.76303100585938, -67.68585205078125, -63.608680725097656, -59.5315055847168, -55.45433044433594, -51.37715530395508, -47.29998016357422, -43.22280502319336, -39.1456298828125, -35.06845474243164, -30.99127960205078, -26.914104461669922, -22.836929321289062, -18.759754180908203, -14.682579040527344, -10.605403900146484, -6.528221130371094, -2.4510459899902344, 1.626129150390625, 5.703304290771484, 9.780479431152344, 13.857654571533203, 17.934829711914062, 22.012004852294922, 26.08917999267578, 30.16635513305664, 34.2435302734375, 38.32070541381836, 42.39788055419922, 46.47505569458008, 50.55223083496094, 54.6294059753418, 58.706581115722656, 62.783756256103516, 66.86093139648438, 70.9381103515625, 75.0152816772461, 79.09245300292969, 83.16963195800781, 87.24681091308594, 91.32398223876953, 95.40115356445312, 99.47833251953125, 103.55551147460938, 107.63268280029297, 111.70985412597656, 115.78703308105469, 119.86421203613281, 123.9413833618164]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 8.0, 8.0, 9.0, 7.0, 14.0, 20.0, 33.0, 45.0, 53.0, 82.0, 211.0, 344.0, 609.0, 1177.0, 2760.0, 6638.0, 17387.0, 55073.0, 287098.0, 3556693.0, 197355.0, 44065.0, 14474.0, 5596.0, 2320.0, 1056.0, 513.0, 282.0, 149.0, 85.0, 40.0, 20.0, 24.0, 8.0, 11.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-53.53125, -52.01953125, -50.5078125, -48.99609375, -47.484375, -45.97265625, -44.4609375, -42.94921875, -41.4375, -39.92578125, -38.4140625, -36.90234375, -35.390625, -33.87890625, -32.3671875, -30.85546875, -29.34375, -27.83203125, -26.3203125, -24.80859375, -23.296875, -21.78515625, -20.2734375, -18.76171875, -17.25, -15.73828125, -14.2265625, -12.71484375, -11.203125, -9.69140625, -8.1796875, -6.66796875, -5.15625, -3.64453125, -2.1328125, -0.62109375, 0.890625, 2.40234375, 3.9140625, 5.42578125, 6.9375, 8.44921875, 9.9609375, 11.47265625, 12.984375, 14.49609375, 16.0078125, 17.51953125, 19.03125, 20.54296875, 22.0546875, 23.56640625, 25.078125, 26.58984375, 28.1015625, 29.61328125, 31.125, 32.63671875, 34.1484375, 35.66015625, 37.171875, 38.68359375, 40.1953125, 41.70703125, 43.21875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 10.0, 12.0, 9.0, 16.0, 17.0, 21.0, 25.0, 37.0, 34.0, 32.0, 53.0, 53.0, 51.0, 51.0, 70.0, 58.0, 57.0, 56.0, 55.0, 51.0, 45.0, 33.0, 36.0, 29.0, 15.0, 17.0, 13.0, 14.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.45703125, -7.24420166015625, -7.0313720703125, -6.81854248046875, -6.605712890625, -6.39288330078125, -6.1800537109375, -5.96722412109375, -5.75439453125, -5.54156494140625, -5.3287353515625, -5.11590576171875, -4.903076171875, -4.69024658203125, -4.4774169921875, -4.26458740234375, -4.0517578125, -3.83892822265625, -3.6260986328125, -3.41326904296875, -3.200439453125, -2.98760986328125, -2.7747802734375, -2.56195068359375, -2.34912109375, -2.13629150390625, -1.9234619140625, -1.71063232421875, -1.497802734375, -1.28497314453125, -1.0721435546875, -0.85931396484375, -0.646484375, -0.43365478515625, -0.2208251953125, -0.00799560546875, 0.204833984375, 0.41766357421875, 0.6304931640625, 0.84332275390625, 1.05615234375, 1.26898193359375, 1.4818115234375, 1.69464111328125, 1.907470703125, 2.12030029296875, 2.3331298828125, 2.54595947265625, 2.7587890625, 2.97161865234375, 3.1844482421875, 3.39727783203125, 3.610107421875, 3.82293701171875, 4.0357666015625, 4.24859619140625, 4.46142578125, 4.67425537109375, 4.8870849609375, 5.09991455078125, 5.312744140625, 5.52557373046875, 5.7384033203125, 5.95123291015625, 6.1640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 8.0, 4.0, 7.0, 10.0, 8.0, 28.0, 26.0, 56.0, 49.0, 101.0, 112.0, 169.0, 259.0, 426.0, 649.0, 1035.0, 1796.0, 3025.0, 5376.0, 10109.0, 20782.0, 47356.0, 128416.0, 526775.0, 2957008.0, 322767.0, 93674.0, 36664.0, 17035.0, 8596.0, 4657.0, 2700.0, 1647.0, 969.0, 640.0, 400.0, 311.0, 181.0, 124.0, 100.0, 66.0, 46.0, 39.0, 18.0, 20.0, 11.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-29.46875, -28.529052734375, -27.58935546875, -26.649658203125, -25.7099609375, -24.770263671875, -23.83056640625, -22.890869140625, -21.951171875, -21.011474609375, -20.07177734375, -19.132080078125, -18.1923828125, -17.252685546875, -16.31298828125, -15.373291015625, -14.43359375, -13.493896484375, -12.55419921875, -11.614501953125, -10.6748046875, -9.735107421875, -8.79541015625, -7.855712890625, -6.916015625, -5.976318359375, -5.03662109375, -4.096923828125, -3.1572265625, -2.217529296875, -1.27783203125, -0.338134765625, 0.6015625, 1.541259765625, 2.48095703125, 3.420654296875, 4.3603515625, 5.300048828125, 6.23974609375, 7.179443359375, 8.119140625, 9.058837890625, 9.99853515625, 10.938232421875, 11.8779296875, 12.817626953125, 13.75732421875, 14.697021484375, 15.63671875, 16.576416015625, 17.51611328125, 18.455810546875, 19.3955078125, 20.335205078125, 21.27490234375, 22.214599609375, 23.154296875, 24.093994140625, 25.03369140625, 25.973388671875, 26.9130859375, 27.852783203125, 28.79248046875, 29.732177734375, 30.671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 9.0, 21.0, 16.0, 19.0, 49.0, 47.0, 90.0, 86.0, 135.0, 200.0, 313.0, 1102.0, 999.0, 312.0, 178.0, 130.0, 77.0, 58.0, 32.0, 30.0, 31.0, 19.0, 15.0, 15.0, 13.0, 6.0, 6.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.1484375, -12.6785888671875, -12.208740234375, -11.7388916015625, -11.26904296875, -10.7991943359375, -10.329345703125, -9.8594970703125, -9.3896484375, -8.9197998046875, -8.449951171875, -7.9801025390625, -7.51025390625, -7.0404052734375, -6.570556640625, -6.1007080078125, -5.630859375, -5.1610107421875, -4.691162109375, -4.2213134765625, -3.75146484375, -3.2816162109375, -2.811767578125, -2.3419189453125, -1.8720703125, -1.4022216796875, -0.932373046875, -0.4625244140625, 0.00732421875, 0.4771728515625, 0.947021484375, 1.4168701171875, 1.88671875, 2.3565673828125, 2.826416015625, 3.2962646484375, 3.76611328125, 4.2359619140625, 4.705810546875, 5.1756591796875, 5.6455078125, 6.1153564453125, 6.585205078125, 7.0550537109375, 7.52490234375, 7.9947509765625, 8.464599609375, 8.9344482421875, 9.404296875, 9.8741455078125, 10.343994140625, 10.8138427734375, 11.28369140625, 11.7535400390625, 12.223388671875, 12.6932373046875, 13.1630859375, 13.6329345703125, 14.102783203125, 14.5726318359375, 15.04248046875, 15.5123291015625, 15.982177734375, 16.4520263671875, 16.921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 7.0, 7.0, 15.0, 24.0, 48.0, 62.0, 100.0, 146.0, 183.0, 138.0, 101.0, 67.0, 41.0, 29.0, 16.0, 12.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.6975555419922, -159.95765686035156, -155.2177734375, -150.47787475585938, -145.73797607421875, -140.99807739257812, -136.2581787109375, -131.51829528808594, -126.77839660644531, -122.03849792480469, -117.2986068725586, -112.5587158203125, -107.81881713867188, -103.07891845703125, -98.33902740478516, -93.59913635253906, -88.85923767089844, -84.11933898925781, -79.37944793701172, -74.63955688476562, -69.899658203125, -65.15975952148438, -60.41986846923828, -55.67997360229492, -50.94007873535156, -46.2001838684082, -41.460289001464844, -36.720394134521484, -31.980499267578125, -27.240604400634766, -22.500709533691406, -17.760814666748047, -13.020904541015625, -8.281009674072266, -3.5411148071289062, 1.1987800598144531, 5.9386749267578125, 10.678569793701172, 15.418464660644531, 20.15835952758789, 24.89825439453125, 29.63814926147461, 34.37804412841797, 39.11793899536133, 43.85783386230469, 48.59772872924805, 53.337623596191406, 58.077518463134766, 62.817413330078125, 67.55731201171875, 72.29720306396484, 77.03709411621094, 81.77699279785156, 86.51689147949219, 91.25678253173828, 95.99667358398438, 100.736572265625, 105.47647094726562, 110.21636199951172, 114.95625305175781, 119.69615173339844, 124.43605041503906, 129.17593383789062, 133.91583251953125, 138.65573120117188]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 4.0, 8.0, 6.0, 10.0, 14.0, 7.0, 12.0, 14.0, 11.0, 19.0, 22.0, 18.0, 20.0, 26.0, 31.0, 26.0, 33.0, 34.0, 39.0, 40.0, 43.0, 41.0, 40.0, 36.0, 46.0, 39.0, 38.0, 27.0, 34.0, 29.0, 31.0, 32.0, 24.0, 19.0, 25.0, 7.0, 15.0, 18.0, 9.0, 13.0, 9.0, 13.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-53.023902893066406, -51.3731689453125, -49.722434997558594, -48.07170104980469, -46.42096710205078, -44.770233154296875, -43.11949920654297, -41.46876525878906, -39.818031311035156, -38.16729736328125, -36.516563415527344, -34.86582946777344, -33.21509552001953, -31.564361572265625, -29.91362953186035, -28.262895584106445, -26.612163543701172, -24.961429595947266, -23.31069564819336, -21.659961700439453, -20.009227752685547, -18.35849380493164, -16.707761764526367, -15.057027816772461, -13.406293869018555, -11.755559921264648, -10.104825973510742, -8.454092979431152, -6.803359031677246, -5.15262508392334, -3.50189208984375, -1.8511581420898438, -0.2004241943359375, 1.4503095149993896, 3.101043224334717, 4.751776695251465, 6.402510643005371, 8.053244590759277, 9.703977584838867, 11.354711532592773, 13.00544548034668, 14.656179428100586, 16.306913375854492, 17.957645416259766, 19.608379364013672, 21.259113311767578, 22.909847259521484, 24.56058120727539, 26.211315155029297, 27.862049102783203, 29.51278305053711, 31.163516998291016, 32.81425094604492, 34.46498489379883, 36.11571502685547, 37.766448974609375, 39.41718292236328, 41.06791687011719, 42.718650817871094, 44.369384765625, 46.020118713378906, 47.67085266113281, 49.32158660888672, 50.972320556640625, 52.62305450439453]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 18.0, 16.0, 20.0, 45.0, 51.0, 100.0, 150.0, 239.0, 472.0, 875.0, 1992.0, 4451.0, 11528.0, 32583.0, 103283.0, 377490.0, 364283.0, 99754.0, 31566.0, 11278.0, 4400.0, 1939.0, 934.0, 451.0, 243.0, 134.0, 83.0, 62.0, 40.0, 22.0, 17.0, 14.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0625, -49.56005859375, -48.0576171875, -46.55517578125, -45.052734375, -43.55029296875, -42.0478515625, -40.54541015625, -39.04296875, -37.54052734375, -36.0380859375, -34.53564453125, -33.033203125, -31.53076171875, -30.0283203125, -28.52587890625, -27.0234375, -25.52099609375, -24.0185546875, -22.51611328125, -21.013671875, -19.51123046875, -18.0087890625, -16.50634765625, -15.00390625, -13.50146484375, -11.9990234375, -10.49658203125, -8.994140625, -7.49169921875, -5.9892578125, -4.48681640625, -2.984375, -1.48193359375, 0.0205078125, 1.52294921875, 3.025390625, 4.52783203125, 6.0302734375, 7.53271484375, 9.03515625, 10.53759765625, 12.0400390625, 13.54248046875, 15.044921875, 16.54736328125, 18.0498046875, 19.55224609375, 21.0546875, 22.55712890625, 24.0595703125, 25.56201171875, 27.064453125, 28.56689453125, 30.0693359375, 31.57177734375, 33.07421875, 34.57666015625, 36.0791015625, 37.58154296875, 39.083984375, 40.58642578125, 42.0888671875, 43.59130859375, 45.09375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 3.0, 10.0, 12.0, 15.0, 17.0, 12.0, 25.0, 24.0, 34.0, 42.0, 35.0, 42.0, 35.0, 50.0, 62.0, 49.0, 55.0, 62.0, 53.0, 52.0, 43.0, 45.0, 45.0, 30.0, 24.0, 25.0, 15.0, 16.0, 13.0, 11.0, 5.0, 9.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.02734375, -5.82806396484375, -5.6287841796875, -5.42950439453125, -5.230224609375, -5.03094482421875, -4.8316650390625, -4.63238525390625, -4.43310546875, -4.23382568359375, -4.0345458984375, -3.83526611328125, -3.635986328125, -3.43670654296875, -3.2374267578125, -3.03814697265625, -2.8388671875, -2.63958740234375, -2.4403076171875, -2.24102783203125, -2.041748046875, -1.84246826171875, -1.6431884765625, -1.44390869140625, -1.24462890625, -1.04534912109375, -0.8460693359375, -0.64678955078125, -0.447509765625, -0.24822998046875, -0.0489501953125, 0.15032958984375, 0.349609375, 0.54888916015625, 0.7481689453125, 0.94744873046875, 1.146728515625, 1.34600830078125, 1.5452880859375, 1.74456787109375, 1.94384765625, 2.14312744140625, 2.3424072265625, 2.54168701171875, 2.740966796875, 2.94024658203125, 3.1395263671875, 3.33880615234375, 3.5380859375, 3.73736572265625, 3.9366455078125, 4.13592529296875, 4.335205078125, 4.53448486328125, 4.7337646484375, 4.93304443359375, 5.13232421875, 5.33160400390625, 5.5308837890625, 5.73016357421875, 5.929443359375, 6.12872314453125, 6.3280029296875, 6.52728271484375, 6.7265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 11.0, 11.0, 18.0, 27.0, 39.0, 68.0, 86.0, 157.0, 246.0, 444.0, 778.0, 1293.0, 2520.0, 5012.0, 11777.0, 30295.0, 85781.0, 274777.0, 423919.0, 134443.0, 45696.0, 16878.0, 7022.0, 3297.0, 1684.0, 914.0, 537.0, 302.0, 175.0, 133.0, 65.0, 43.0, 30.0, 25.0, 13.0, 18.0, 6.0, 5.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.125, -30.98583984375, -29.8466796875, -28.70751953125, -27.568359375, -26.42919921875, -25.2900390625, -24.15087890625, -23.01171875, -21.87255859375, -20.7333984375, -19.59423828125, -18.455078125, -17.31591796875, -16.1767578125, -15.03759765625, -13.8984375, -12.75927734375, -11.6201171875, -10.48095703125, -9.341796875, -8.20263671875, -7.0634765625, -5.92431640625, -4.78515625, -3.64599609375, -2.5068359375, -1.36767578125, -0.228515625, 0.91064453125, 2.0498046875, 3.18896484375, 4.328125, 5.46728515625, 6.6064453125, 7.74560546875, 8.884765625, 10.02392578125, 11.1630859375, 12.30224609375, 13.44140625, 14.58056640625, 15.7197265625, 16.85888671875, 17.998046875, 19.13720703125, 20.2763671875, 21.41552734375, 22.5546875, 23.69384765625, 24.8330078125, 25.97216796875, 27.111328125, 28.25048828125, 29.3896484375, 30.52880859375, 31.66796875, 32.80712890625, 33.9462890625, 35.08544921875, 36.224609375, 37.36376953125, 38.5029296875, 39.64208984375, 40.78125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 5.0, 15.0, 12.0, 20.0, 23.0, 21.0, 27.0, 34.0, 39.0, 40.0, 48.0, 38.0, 64.0, 43.0, 64.0, 59.0, 58.0, 57.0, 35.0, 42.0, 35.0, 29.0, 30.0, 29.0, 25.0, 19.0, 23.0, 9.0, 11.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.10595703125, -27.0556640625, -26.00537109375, -24.955078125, -23.90478515625, -22.8544921875, -21.80419921875, -20.75390625, -19.70361328125, -18.6533203125, -17.60302734375, -16.552734375, -15.50244140625, -14.4521484375, -13.40185546875, -12.3515625, -11.30126953125, -10.2509765625, -9.20068359375, -8.150390625, -7.10009765625, -6.0498046875, -4.99951171875, -3.94921875, -2.89892578125, -1.8486328125, -0.79833984375, 0.251953125, 1.30224609375, 2.3525390625, 3.40283203125, 4.453125, 5.50341796875, 6.5537109375, 7.60400390625, 8.654296875, 9.70458984375, 10.7548828125, 11.80517578125, 12.85546875, 13.90576171875, 14.9560546875, 16.00634765625, 17.056640625, 18.10693359375, 19.1572265625, 20.20751953125, 21.2578125, 22.30810546875, 23.3583984375, 24.40869140625, 25.458984375, 26.50927734375, 27.5595703125, 28.60986328125, 29.66015625, 30.71044921875, 31.7607421875, 32.81103515625, 33.861328125, 34.91162109375, 35.9619140625, 37.01220703125, 38.0625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 9.0, 9.0, 15.0, 28.0, 45.0, 76.0, 95.0, 171.0, 326.0, 594.0, 1271.0, 2672.0, 6970.0, 26457.0, 216110.0, 685800.0, 84330.0, 14701.0, 4837.0, 1957.0, 948.0, 495.0, 262.0, 138.0, 86.0, 59.0, 44.0, 10.0, 12.0, 14.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.390625, -30.387939453125, -29.38525390625, -28.382568359375, -27.3798828125, -26.377197265625, -25.37451171875, -24.371826171875, -23.369140625, -22.366455078125, -21.36376953125, -20.361083984375, -19.3583984375, -18.355712890625, -17.35302734375, -16.350341796875, -15.34765625, -14.344970703125, -13.34228515625, -12.339599609375, -11.3369140625, -10.334228515625, -9.33154296875, -8.328857421875, -7.326171875, -6.323486328125, -5.32080078125, -4.318115234375, -3.3154296875, -2.312744140625, -1.31005859375, -0.307373046875, 0.6953125, 1.697998046875, 2.70068359375, 3.703369140625, 4.7060546875, 5.708740234375, 6.71142578125, 7.714111328125, 8.716796875, 9.719482421875, 10.72216796875, 11.724853515625, 12.7275390625, 13.730224609375, 14.73291015625, 15.735595703125, 16.73828125, 17.740966796875, 18.74365234375, 19.746337890625, 20.7490234375, 21.751708984375, 22.75439453125, 23.757080078125, 24.759765625, 25.762451171875, 26.76513671875, 27.767822265625, 28.7705078125, 29.773193359375, 30.77587890625, 31.778564453125, 32.78125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 12.0, 20.0, 30.0, 73.0, 165.0, 293.0, 226.0, 82.0, 39.0, 14.0, 13.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01534271240234375, -0.014990806579589844, -0.014638900756835938, -0.014286994934082031, -0.013935089111328125, -0.013583183288574219, -0.013231277465820312, -0.012879371643066406, -0.0125274658203125, -0.012175559997558594, -0.011823654174804688, -0.011471748352050781, -0.011119842529296875, -0.010767936706542969, -0.010416030883789062, -0.010064125061035156, -0.00971221923828125, -0.009360313415527344, -0.009008407592773438, -0.008656501770019531, -0.008304595947265625, -0.007952690124511719, -0.0076007843017578125, -0.007248878479003906, -0.00689697265625, -0.006545066833496094, -0.0061931610107421875, -0.005841255187988281, -0.005489349365234375, -0.005137443542480469, -0.0047855377197265625, -0.004433631896972656, -0.00408172607421875, -0.0037298202514648438, -0.0033779144287109375, -0.0030260086059570312, -0.002674102783203125, -0.0023221969604492188, -0.0019702911376953125, -0.0016183853149414062, -0.0012664794921875, -0.0009145736694335938, -0.0005626678466796875, -0.00021076202392578125, 0.000141143798828125, 0.0004930496215820312, 0.0008449554443359375, 0.0011968612670898438, 0.00154876708984375, 0.0019006729125976562, 0.0022525787353515625, 0.0026044845581054688, 0.002956390380859375, 0.0033082962036132812, 0.0036602020263671875, 0.004012107849121094, 0.004364013671875, 0.004715919494628906, 0.0050678253173828125, 0.005419731140136719, 0.005771636962890625, 0.006123542785644531, 0.0064754486083984375, 0.006827354431152344, 0.00717926025390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 7.0, 10.0, 8.0, 18.0, 26.0, 29.0, 32.0, 66.0, 96.0, 219.0, 483.0, 1273.0, 4264.0, 18873.0, 207185.0, 753871.0, 49893.0, 8553.0, 2228.0, 759.0, 293.0, 133.0, 84.0, 47.0, 31.0, 16.0, 21.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.0830078125, -37.791015625, -36.4990234375, -35.20703125, -33.9150390625, -32.623046875, -31.3310546875, -30.0390625, -28.7470703125, -27.455078125, -26.1630859375, -24.87109375, -23.5791015625, -22.287109375, -20.9951171875, -19.703125, -18.4111328125, -17.119140625, -15.8271484375, -14.53515625, -13.2431640625, -11.951171875, -10.6591796875, -9.3671875, -8.0751953125, -6.783203125, -5.4912109375, -4.19921875, -2.9072265625, -1.615234375, -0.3232421875, 0.96875, 2.2607421875, 3.552734375, 4.8447265625, 6.13671875, 7.4287109375, 8.720703125, 10.0126953125, 11.3046875, 12.5966796875, 13.888671875, 15.1806640625, 16.47265625, 17.7646484375, 19.056640625, 20.3486328125, 21.640625, 22.9326171875, 24.224609375, 25.5166015625, 26.80859375, 28.1005859375, 29.392578125, 30.6845703125, 31.9765625, 33.2685546875, 34.560546875, 35.8525390625, 37.14453125, 38.4365234375, 39.728515625, 41.0205078125, 42.3125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 15.0, 28.0, 38.0, 84.0, 139.0, 147.0, 182.0, 128.0, 69.0, 59.0, 29.0, 14.0, 18.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.1529541015625, -12.376220703125, -11.5994873046875, -10.82275390625, -10.0460205078125, -9.269287109375, -8.4925537109375, -7.7158203125, -6.9390869140625, -6.162353515625, -5.3856201171875, -4.60888671875, -3.8321533203125, -3.055419921875, -2.2786865234375, -1.501953125, -0.7252197265625, 0.051513671875, 0.8282470703125, 1.60498046875, 2.3817138671875, 3.158447265625, 3.9351806640625, 4.7119140625, 5.4886474609375, 6.265380859375, 7.0421142578125, 7.81884765625, 8.5955810546875, 9.372314453125, 10.1490478515625, 10.92578125, 11.7025146484375, 12.479248046875, 13.2559814453125, 14.03271484375, 14.8094482421875, 15.586181640625, 16.3629150390625, 17.1396484375, 17.9163818359375, 18.693115234375, 19.4698486328125, 20.24658203125, 21.0233154296875, 21.800048828125, 22.5767822265625, 23.353515625, 24.1302490234375, 24.906982421875, 25.6837158203125, 26.46044921875, 27.2371826171875, 28.013916015625, 28.7906494140625, 29.5673828125, 30.3441162109375, 31.120849609375, 31.8975830078125, 32.67431640625, 33.4510498046875, 34.227783203125, 35.0045166015625, 35.78125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 10.0, 8.0, 16.0, 34.0, 43.0, 55.0, 71.0, 94.0, 113.0, 138.0, 103.0, 88.0, 76.0, 50.0, 24.0, 18.0, 18.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.0894775390625, -247.854736328125, -239.6199951171875, -231.38525390625, -223.15049743652344, -214.91575622558594, -206.68101501464844, -198.44627380371094, -190.21151733398438, -181.97677612304688, -173.74203491210938, -165.50729370117188, -157.2725372314453, -149.0377960205078, -140.8030548095703, -132.5683135986328, -124.33357238769531, -116.09883117675781, -107.86408233642578, -99.62934112548828, -91.39459228515625, -83.15985107421875, -74.92510986328125, -66.69036865234375, -58.45561981201172, -50.22087478637695, -41.98612976074219, -33.75138854980469, -25.516643524169922, -17.281898498535156, -9.047157287597656, -0.8124122619628906, 7.422332763671875, 15.657076835632324, 23.891820907592773, 32.126564025878906, 40.36130905151367, 48.59605407714844, 56.83079528808594, 65.06553649902344, 73.30028533935547, 81.53502655029297, 89.769775390625, 98.0045166015625, 106.2392578125, 114.47400665283203, 122.70874786376953, 130.94349670410156, 139.17823791503906, 147.41297912597656, 155.64772033691406, 163.88247680664062, 172.11721801757812, 180.35195922851562, 188.58670043945312, 196.82144165039062, 205.05618286132812, 213.29092407226562, 221.52566528320312, 229.76040649414062, 237.9951629638672, 246.2299041748047, 254.4646453857422, 262.69940185546875, 270.93414306640625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 5.0, 13.0, 10.0, 10.0, 17.0, 12.0, 19.0, 22.0, 26.0, 30.0, 23.0, 23.0, 35.0, 26.0, 34.0, 38.0, 43.0, 48.0, 46.0, 39.0, 42.0, 40.0, 41.0, 30.0, 43.0, 29.0, 27.0, 45.0, 21.0, 21.0, 15.0, 20.0, 15.0, 15.0, 13.0, 18.0, 5.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.3483428955078, -152.33303833007812, -147.31773376464844, -142.3024139404297, -137.287109375, -132.2718048095703, -127.25650024414062, -122.24119567871094, -117.22588348388672, -112.21057891845703, -107.19526672363281, -102.17996215820312, -97.16465759277344, -92.14934539794922, -87.13404083251953, -82.11872863769531, -77.10342407226562, -72.08811950683594, -67.07280731201172, -62.05750274658203, -57.04219436645508, -52.026885986328125, -47.01158142089844, -41.996273040771484, -36.98096466064453, -31.965656280517578, -26.950349807739258, -21.935043334960938, -16.919734954833984, -11.904426574707031, -6.889120101928711, -1.8738136291503906, 3.1414947509765625, 8.1568021774292, 13.172109603881836, 18.187416076660156, 23.20272445678711, 28.218032836914062, 33.23333740234375, 38.2486457824707, 43.263954162597656, 48.27926254272461, 53.29457092285156, 58.30987548828125, 63.3251838684082, 68.34049224853516, 73.35579681396484, 78.37110900878906, 83.38641357421875, 88.40171813964844, 93.41703033447266, 98.43233489990234, 103.44764709472656, 108.46295166015625, 113.47825622558594, 118.49356079101562, 123.50887298583984, 128.52418518066406, 133.53948974609375, 138.55479431152344, 143.57009887695312, 148.58541870117188, 153.60072326660156, 158.61602783203125, 163.63133239746094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 1.0, 8.0, 9.0, 7.0, 13.0, 11.0, 19.0, 31.0, 36.0, 50.0, 63.0, 90.0, 127.0, 200.0, 297.0, 451.0, 627.0, 1018.0, 1594.0, 2755.0, 4804.0, 9020.0, 18885.0, 47462.0, 182228.0, 3613362.0, 215585.0, 52137.0, 20819.0, 9798.0, 5069.0, 2837.0, 1707.0, 1064.0, 676.0, 420.0, 292.0, 216.0, 158.0, 97.0, 72.0, 42.0, 42.0, 27.0, 17.0, 6.0, 14.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.15625, -36.98388671875, -35.8115234375, -34.63916015625, -33.466796875, -32.29443359375, -31.1220703125, -29.94970703125, -28.77734375, -27.60498046875, -26.4326171875, -25.26025390625, -24.087890625, -22.91552734375, -21.7431640625, -20.57080078125, -19.3984375, -18.22607421875, -17.0537109375, -15.88134765625, -14.708984375, -13.53662109375, -12.3642578125, -11.19189453125, -10.01953125, -8.84716796875, -7.6748046875, -6.50244140625, -5.330078125, -4.15771484375, -2.9853515625, -1.81298828125, -0.640625, 0.53173828125, 1.7041015625, 2.87646484375, 4.048828125, 5.22119140625, 6.3935546875, 7.56591796875, 8.73828125, 9.91064453125, 11.0830078125, 12.25537109375, 13.427734375, 14.60009765625, 15.7724609375, 16.94482421875, 18.1171875, 19.28955078125, 20.4619140625, 21.63427734375, 22.806640625, 23.97900390625, 25.1513671875, 26.32373046875, 27.49609375, 28.66845703125, 29.8408203125, 31.01318359375, 32.185546875, 33.35791015625, 34.5302734375, 35.70263671875, 36.875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 7.0, 13.0, 11.0, 19.0, 26.0, 22.0, 33.0, 30.0, 41.0, 50.0, 63.0, 67.0, 46.0, 70.0, 62.0, 56.0, 57.0, 49.0, 40.0, 40.0, 44.0, 23.0, 20.0, 17.0, 22.0, 17.0, 6.0, 12.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.83197021484375, -7.5858154296875, -7.33966064453125, -7.093505859375, -6.84735107421875, -6.6011962890625, -6.35504150390625, -6.10888671875, -5.86273193359375, -5.6165771484375, -5.37042236328125, -5.124267578125, -4.87811279296875, -4.6319580078125, -4.38580322265625, -4.1396484375, -3.89349365234375, -3.6473388671875, -3.40118408203125, -3.155029296875, -2.90887451171875, -2.6627197265625, -2.41656494140625, -2.17041015625, -1.92425537109375, -1.6781005859375, -1.43194580078125, -1.185791015625, -0.93963623046875, -0.6934814453125, -0.44732666015625, -0.201171875, 0.04498291015625, 0.2911376953125, 0.53729248046875, 0.783447265625, 1.02960205078125, 1.2757568359375, 1.52191162109375, 1.76806640625, 2.01422119140625, 2.2603759765625, 2.50653076171875, 2.752685546875, 2.99884033203125, 3.2449951171875, 3.49114990234375, 3.7373046875, 3.98345947265625, 4.2296142578125, 4.47576904296875, 4.721923828125, 4.96807861328125, 5.2142333984375, 5.46038818359375, 5.70654296875, 5.95269775390625, 6.1988525390625, 6.44500732421875, 6.691162109375, 6.93731689453125, 7.1834716796875, 7.42962646484375, 7.67578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 13.0, 11.0, 16.0, 14.0, 14.0, 29.0, 41.0, 40.0, 59.0, 70.0, 128.0, 173.0, 301.0, 532.0, 1241.0, 3288.0, 10633.0, 49090.0, 1468107.0, 2592680.0, 50599.0, 11171.0, 3273.0, 1282.0, 554.0, 280.0, 169.0, 122.0, 73.0, 54.0, 48.0, 39.0, 26.0, 17.0, 16.0, 16.0, 10.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.125, -80.4443359375, -77.763671875, -75.0830078125, -72.40234375, -69.7216796875, -67.041015625, -64.3603515625, -61.6796875, -58.9990234375, -56.318359375, -53.6376953125, -50.95703125, -48.2763671875, -45.595703125, -42.9150390625, -40.234375, -37.5537109375, -34.873046875, -32.1923828125, -29.51171875, -26.8310546875, -24.150390625, -21.4697265625, -18.7890625, -16.1083984375, -13.427734375, -10.7470703125, -8.06640625, -5.3857421875, -2.705078125, -0.0244140625, 2.65625, 5.3369140625, 8.017578125, 10.6982421875, 13.37890625, 16.0595703125, 18.740234375, 21.4208984375, 24.1015625, 26.7822265625, 29.462890625, 32.1435546875, 34.82421875, 37.5048828125, 40.185546875, 42.8662109375, 45.546875, 48.2275390625, 50.908203125, 53.5888671875, 56.26953125, 58.9501953125, 61.630859375, 64.3115234375, 66.9921875, 69.6728515625, 72.353515625, 75.0341796875, 77.71484375, 80.3955078125, 83.076171875, 85.7568359375, 88.4375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 9.0, 9.0, 15.0, 22.0, 36.0, 48.0, 114.0, 301.0, 2643.0, 532.0, 168.0, 80.0, 34.0, 30.0, 19.0, 9.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-47.84375, -46.74853515625, -45.6533203125, -44.55810546875, -43.462890625, -42.36767578125, -41.2724609375, -40.17724609375, -39.08203125, -37.98681640625, -36.8916015625, -35.79638671875, -34.701171875, -33.60595703125, -32.5107421875, -31.41552734375, -30.3203125, -29.22509765625, -28.1298828125, -27.03466796875, -25.939453125, -24.84423828125, -23.7490234375, -22.65380859375, -21.55859375, -20.46337890625, -19.3681640625, -18.27294921875, -17.177734375, -16.08251953125, -14.9873046875, -13.89208984375, -12.796875, -11.70166015625, -10.6064453125, -9.51123046875, -8.416015625, -7.32080078125, -6.2255859375, -5.13037109375, -4.03515625, -2.93994140625, -1.8447265625, -0.74951171875, 0.345703125, 1.44091796875, 2.5361328125, 3.63134765625, 4.7265625, 5.82177734375, 6.9169921875, 8.01220703125, 9.107421875, 10.20263671875, 11.2978515625, 12.39306640625, 13.48828125, 14.58349609375, 15.6787109375, 16.77392578125, 17.869140625, 18.96435546875, 20.0595703125, 21.15478515625, 22.25]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 12.0, 14.0, 10.0, 38.0, 45.0, 49.0, 88.0, 87.0, 132.0, 132.0, 101.0, 83.0, 56.0, 39.0, 29.0, 18.0, 12.0, 9.0, 11.0, 6.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-143.51214599609375, -140.02114868164062, -136.53013610839844, -133.03912353515625, -129.54812622070312, -126.05712127685547, -122.56611633300781, -119.07511138916016, -115.5841064453125, -112.09310150146484, -108.60209655761719, -105.11109161376953, -101.62008666992188, -98.12908172607422, -94.63807678222656, -91.1470718383789, -87.65606689453125, -84.1650619506836, -80.67405700683594, -77.18305206298828, -73.69204711914062, -70.20104217529297, -66.71003723144531, -63.219032287597656, -59.72802734375, -56.237022399902344, -52.74601745605469, -49.25501251220703, -45.764007568359375, -42.27300262451172, -38.78199768066406, -35.290992736816406, -31.79998779296875, -28.308982849121094, -24.817977905273438, -21.32697296142578, -17.835968017578125, -14.344963073730469, -10.853958129882812, -7.362953186035156, -3.8719482421875, -0.38094329833984375, 3.1100616455078125, 6.601066589355469, 10.092071533203125, 13.583076477050781, 17.074081420898438, 20.565086364746094, 24.05609130859375, 27.547096252441406, 31.038101196289062, 34.52910614013672, 38.020111083984375, 41.51111602783203, 45.00212097167969, 48.493125915527344, 51.984130859375, 55.475135803222656, 58.96614074707031, 62.45714569091797, 65.94815063476562, 69.43915557861328, 72.93016052246094, 76.4211654663086, 79.91217041015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 15.0, 15.0, 25.0, 15.0, 27.0, 41.0, 39.0, 51.0, 42.0, 58.0, 64.0, 70.0, 62.0, 68.0, 66.0, 66.0, 57.0, 49.0, 36.0, 35.0, 28.0, 17.0, 16.0, 13.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.21607971191406, -96.05860137939453, -92.901123046875, -89.74364471435547, -86.58616638183594, -83.4286880493164, -80.27120971679688, -77.11373138427734, -73.95625305175781, -70.79877471923828, -67.64129638671875, -64.48381805419922, -61.32633972167969, -58.168861389160156, -55.011383056640625, -51.853904724121094, -48.69643020629883, -45.5389518737793, -42.381473541259766, -39.223995208740234, -36.0665168762207, -32.90903854370117, -29.751562118530273, -26.594083786010742, -23.43660545349121, -20.27912712097168, -17.12164878845215, -13.964171409606934, -10.806693077087402, -7.649214744567871, -4.491737365722656, -1.334259033203125, 1.8232192993164062, 4.9806976318359375, 8.138175964355469, 11.295653343200684, 14.453131675720215, 17.610610961914062, 20.76808738708496, 23.925565719604492, 27.083044052124023, 30.240522384643555, 33.39799880981445, 36.555477142333984, 39.712955474853516, 42.87043380737305, 46.02791213989258, 49.18539047241211, 52.34286880493164, 55.50034713745117, 58.6578254699707, 61.815303802490234, 64.9727783203125, 68.13025665283203, 71.28773498535156, 74.4452133178711, 77.60269165039062, 80.76016998291016, 83.91764831542969, 87.07512664794922, 90.23260498046875, 93.39008331298828, 96.54756164550781, 99.70503997802734, 102.86251831054688]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 13.0, 11.0, 20.0, 47.0, 38.0, 95.0, 120.0, 194.0, 309.0, 632.0, 1120.0, 2051.0, 3879.0, 7826.0, 16601.0, 36770.0, 86855.0, 226346.0, 385835.0, 162083.0, 64195.0, 27732.0, 12814.0, 6045.0, 3060.0, 1581.0, 916.0, 533.0, 293.0, 183.0, 120.0, 78.0, 52.0, 27.0, 23.0, 17.0, 11.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.46826171875, -31.2802734375, -30.09228515625, -28.904296875, -27.71630859375, -26.5283203125, -25.34033203125, -24.15234375, -22.96435546875, -21.7763671875, -20.58837890625, -19.400390625, -18.21240234375, -17.0244140625, -15.83642578125, -14.6484375, -13.46044921875, -12.2724609375, -11.08447265625, -9.896484375, -8.70849609375, -7.5205078125, -6.33251953125, -5.14453125, -3.95654296875, -2.7685546875, -1.58056640625, -0.392578125, 0.79541015625, 1.9833984375, 3.17138671875, 4.359375, 5.54736328125, 6.7353515625, 7.92333984375, 9.111328125, 10.29931640625, 11.4873046875, 12.67529296875, 13.86328125, 15.05126953125, 16.2392578125, 17.42724609375, 18.615234375, 19.80322265625, 20.9912109375, 22.17919921875, 23.3671875, 24.55517578125, 25.7431640625, 26.93115234375, 28.119140625, 29.30712890625, 30.4951171875, 31.68310546875, 32.87109375, 34.05908203125, 35.2470703125, 36.43505859375, 37.623046875, 38.81103515625, 39.9990234375, 41.18701171875, 42.375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 4.0, 10.0, 12.0, 6.0, 13.0, 12.0, 19.0, 21.0, 18.0, 20.0, 31.0, 27.0, 36.0, 55.0, 45.0, 36.0, 42.0, 43.0, 55.0, 48.0, 46.0, 42.0, 49.0, 43.0, 21.0, 24.0, 32.0, 25.0, 24.0, 25.0, 20.0, 17.0, 13.0, 13.0, 13.0, 10.0, 10.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3046875, -6.10009765625, -5.8955078125, -5.69091796875, -5.486328125, -5.28173828125, -5.0771484375, -4.87255859375, -4.66796875, -4.46337890625, -4.2587890625, -4.05419921875, -3.849609375, -3.64501953125, -3.4404296875, -3.23583984375, -3.03125, -2.82666015625, -2.6220703125, -2.41748046875, -2.212890625, -2.00830078125, -1.8037109375, -1.59912109375, -1.39453125, -1.18994140625, -0.9853515625, -0.78076171875, -0.576171875, -0.37158203125, -0.1669921875, 0.03759765625, 0.2421875, 0.44677734375, 0.6513671875, 0.85595703125, 1.060546875, 1.26513671875, 1.4697265625, 1.67431640625, 1.87890625, 2.08349609375, 2.2880859375, 2.49267578125, 2.697265625, 2.90185546875, 3.1064453125, 3.31103515625, 3.515625, 3.72021484375, 3.9248046875, 4.12939453125, 4.333984375, 4.53857421875, 4.7431640625, 4.94775390625, 5.15234375, 5.35693359375, 5.5615234375, 5.76611328125, 5.970703125, 6.17529296875, 6.3798828125, 6.58447265625, 6.7890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 11.0, 11.0, 11.0, 18.0, 14.0, 36.0, 49.0, 81.0, 110.0, 161.0, 220.0, 394.0, 569.0, 976.0, 1602.0, 2919.0, 5879.0, 11430.0, 24759.0, 56053.0, 139399.0, 357677.0, 266490.0, 100040.0, 41257.0, 18713.0, 9083.0, 4582.0, 2376.0, 1395.0, 795.0, 483.0, 324.0, 215.0, 131.0, 87.0, 59.0, 45.0, 25.0, 22.0, 11.0, 7.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.609375, -25.74609375, -24.8828125, -24.01953125, -23.15625, -22.29296875, -21.4296875, -20.56640625, -19.703125, -18.83984375, -17.9765625, -17.11328125, -16.25, -15.38671875, -14.5234375, -13.66015625, -12.796875, -11.93359375, -11.0703125, -10.20703125, -9.34375, -8.48046875, -7.6171875, -6.75390625, -5.890625, -5.02734375, -4.1640625, -3.30078125, -2.4375, -1.57421875, -0.7109375, 0.15234375, 1.015625, 1.87890625, 2.7421875, 3.60546875, 4.46875, 5.33203125, 6.1953125, 7.05859375, 7.921875, 8.78515625, 9.6484375, 10.51171875, 11.375, 12.23828125, 13.1015625, 13.96484375, 14.828125, 15.69140625, 16.5546875, 17.41796875, 18.28125, 19.14453125, 20.0078125, 20.87109375, 21.734375, 22.59765625, 23.4609375, 24.32421875, 25.1875, 26.05078125, 26.9140625, 27.77734375, 28.640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 3.0, 3.0, 11.0, 14.0, 19.0, 15.0, 18.0, 22.0, 28.0, 30.0, 35.0, 46.0, 41.0, 53.0, 39.0, 42.0, 51.0, 49.0, 61.0, 35.0, 40.0, 43.0, 36.0, 36.0, 37.0, 24.0, 30.0, 13.0, 24.0, 16.0, 11.0, 16.0, 9.0, 13.0, 7.0, 8.0, 6.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78125, -25.81982421875, -24.8583984375, -23.89697265625, -22.935546875, -21.97412109375, -21.0126953125, -20.05126953125, -19.08984375, -18.12841796875, -17.1669921875, -16.20556640625, -15.244140625, -14.28271484375, -13.3212890625, -12.35986328125, -11.3984375, -10.43701171875, -9.4755859375, -8.51416015625, -7.552734375, -6.59130859375, -5.6298828125, -4.66845703125, -3.70703125, -2.74560546875, -1.7841796875, -0.82275390625, 0.138671875, 1.10009765625, 2.0615234375, 3.02294921875, 3.984375, 4.94580078125, 5.9072265625, 6.86865234375, 7.830078125, 8.79150390625, 9.7529296875, 10.71435546875, 11.67578125, 12.63720703125, 13.5986328125, 14.56005859375, 15.521484375, 16.48291015625, 17.4443359375, 18.40576171875, 19.3671875, 20.32861328125, 21.2900390625, 22.25146484375, 23.212890625, 24.17431640625, 25.1357421875, 26.09716796875, 27.05859375, 28.02001953125, 28.9814453125, 29.94287109375, 30.904296875, 31.86572265625, 32.8271484375, 33.78857421875, 34.75]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 10.0, 22.0, 19.0, 31.0, 54.0, 100.0, 145.0, 242.0, 357.0, 595.0, 1008.0, 1992.0, 4135.0, 11513.0, 45642.0, 296493.0, 556064.0, 97893.0, 19912.0, 6309.0, 2714.0, 1291.0, 774.0, 473.0, 306.0, 178.0, 99.0, 56.0, 41.0, 25.0, 14.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.0, -27.267333984375, -26.53466796875, -25.802001953125, -25.0693359375, -24.336669921875, -23.60400390625, -22.871337890625, -22.138671875, -21.406005859375, -20.67333984375, -19.940673828125, -19.2080078125, -18.475341796875, -17.74267578125, -17.010009765625, -16.27734375, -15.544677734375, -14.81201171875, -14.079345703125, -13.3466796875, -12.614013671875, -11.88134765625, -11.148681640625, -10.416015625, -9.683349609375, -8.95068359375, -8.218017578125, -7.4853515625, -6.752685546875, -6.02001953125, -5.287353515625, -4.5546875, -3.822021484375, -3.08935546875, -2.356689453125, -1.6240234375, -0.891357421875, -0.15869140625, 0.573974609375, 1.306640625, 2.039306640625, 2.77197265625, 3.504638671875, 4.2373046875, 4.969970703125, 5.70263671875, 6.435302734375, 7.16796875, 7.900634765625, 8.63330078125, 9.365966796875, 10.0986328125, 10.831298828125, 11.56396484375, 12.296630859375, 13.029296875, 13.761962890625, 14.49462890625, 15.227294921875, 15.9599609375, 16.692626953125, 17.42529296875, 18.157958984375, 18.890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 28.0, 54.0, 120.0, 286.0, 256.0, 122.0, 43.0, 16.0, 7.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0139617919921875, -0.01358342170715332, -0.01320505142211914, -0.012826681137084961, -0.012448310852050781, -0.012069940567016602, -0.011691570281982422, -0.011313199996948242, -0.010934829711914062, -0.010556459426879883, -0.010178089141845703, -0.009799718856811523, -0.009421348571777344, -0.009042978286743164, -0.008664608001708984, -0.008286237716674805, -0.007907867431640625, -0.007529497146606445, -0.007151126861572266, -0.006772756576538086, -0.006394386291503906, -0.0060160160064697266, -0.005637645721435547, -0.005259275436401367, -0.0048809051513671875, -0.004502534866333008, -0.004124164581298828, -0.0037457942962646484, -0.0033674240112304688, -0.002989053726196289, -0.0026106834411621094, -0.0022323131561279297, -0.00185394287109375, -0.0014755725860595703, -0.0010972023010253906, -0.0007188320159912109, -0.00034046173095703125, 3.790855407714844e-05, 0.0004162788391113281, 0.0007946491241455078, 0.0011730194091796875, 0.0015513896942138672, 0.0019297599792480469, 0.0023081302642822266, 0.0026865005493164062, 0.003064870834350586, 0.0034432411193847656, 0.0038216114044189453, 0.004199981689453125, 0.004578351974487305, 0.004956722259521484, 0.005335092544555664, 0.005713462829589844, 0.0060918331146240234, 0.006470203399658203, 0.006848573684692383, 0.0072269439697265625, 0.007605314254760742, 0.007983684539794922, 0.008362054824829102, 0.008740425109863281, 0.009118795394897461, 0.00949716567993164, 0.00987553596496582, 0.01025390625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 10.0, 17.0, 24.0, 21.0, 42.0, 49.0, 68.0, 107.0, 162.0, 242.0, 459.0, 813.0, 1766.0, 4330.0, 16814.0, 130442.0, 738636.0, 129846.0, 16230.0, 4549.0, 1814.0, 903.0, 446.0, 240.0, 160.0, 117.0, 58.0, 49.0, 46.0, 26.0, 18.0, 10.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.53125, -28.56298828125, -27.5947265625, -26.62646484375, -25.658203125, -24.68994140625, -23.7216796875, -22.75341796875, -21.78515625, -20.81689453125, -19.8486328125, -18.88037109375, -17.912109375, -16.94384765625, -15.9755859375, -15.00732421875, -14.0390625, -13.07080078125, -12.1025390625, -11.13427734375, -10.166015625, -9.19775390625, -8.2294921875, -7.26123046875, -6.29296875, -5.32470703125, -4.3564453125, -3.38818359375, -2.419921875, -1.45166015625, -0.4833984375, 0.48486328125, 1.453125, 2.42138671875, 3.3896484375, 4.35791015625, 5.326171875, 6.29443359375, 7.2626953125, 8.23095703125, 9.19921875, 10.16748046875, 11.1357421875, 12.10400390625, 13.072265625, 14.04052734375, 15.0087890625, 15.97705078125, 16.9453125, 17.91357421875, 18.8818359375, 19.85009765625, 20.818359375, 21.78662109375, 22.7548828125, 23.72314453125, 24.69140625, 25.65966796875, 26.6279296875, 27.59619140625, 28.564453125, 29.53271484375, 30.5009765625, 31.46923828125, 32.4375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 17.0, 51.0, 68.0, 112.0, 185.0, 184.0, 132.0, 95.0, 60.0, 38.0, 8.0, 11.0, 4.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.59375, -28.77490234375, -27.9560546875, -27.13720703125, -26.318359375, -25.49951171875, -24.6806640625, -23.86181640625, -23.04296875, -22.22412109375, -21.4052734375, -20.58642578125, -19.767578125, -18.94873046875, -18.1298828125, -17.31103515625, -16.4921875, -15.67333984375, -14.8544921875, -14.03564453125, -13.216796875, -12.39794921875, -11.5791015625, -10.76025390625, -9.94140625, -9.12255859375, -8.3037109375, -7.48486328125, -6.666015625, -5.84716796875, -5.0283203125, -4.20947265625, -3.390625, -2.57177734375, -1.7529296875, -0.93408203125, -0.115234375, 0.70361328125, 1.5224609375, 2.34130859375, 3.16015625, 3.97900390625, 4.7978515625, 5.61669921875, 6.435546875, 7.25439453125, 8.0732421875, 8.89208984375, 9.7109375, 10.52978515625, 11.3486328125, 12.16748046875, 12.986328125, 13.80517578125, 14.6240234375, 15.44287109375, 16.26171875, 17.08056640625, 17.8994140625, 18.71826171875, 19.537109375, 20.35595703125, 21.1748046875, 21.99365234375, 22.8125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 19.0, 66.0, 165.0, 291.0, 257.0, 131.0, 56.0, 12.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-947.981201171875, -928.575439453125, -909.1696166992188, -889.7638549804688, -870.3580322265625, -850.9522705078125, -831.5465087890625, -812.1406860351562, -792.7349243164062, -773.3291625976562, -753.92333984375, -734.517578125, -715.1117553710938, -695.7059936523438, -676.3001708984375, -656.8944091796875, -637.4886474609375, -618.0828857421875, -598.6770629882812, -579.2713012695312, -559.865478515625, -540.459716796875, -521.053955078125, -501.64813232421875, -482.2423095703125, -462.8365173339844, -443.43072509765625, -424.02496337890625, -404.6191711425781, -385.21337890625, -365.8075866699219, -346.40179443359375, -326.9960021972656, -307.5902099609375, -288.1844177246094, -268.77862548828125, -249.37286376953125, -229.96707153320312, -210.561279296875, -191.15550231933594, -171.7497100830078, -152.3439178466797, -132.93814086914062, -113.5323486328125, -94.1265640258789, -74.72077941894531, -55.31498718261719, -35.909210205078125, -16.50341796875, 2.9023685455322266, 22.308155059814453, 41.71394348144531, 61.119728088378906, 80.5255126953125, 99.93130493164062, 119.33708190917969, 138.7428741455078, 158.14866638183594, 177.554443359375, 196.96023559570312, 216.36602783203125, 235.7718048095703, 255.17759704589844, 274.5833740234375, 293.9891662597656]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 13.0, 7.0, 8.0, 7.0, 13.0, 11.0, 20.0, 24.0, 29.0, 24.0, 39.0, 35.0, 39.0, 35.0, 47.0, 47.0, 49.0, 30.0, 40.0, 37.0, 56.0, 37.0, 34.0, 45.0, 35.0, 36.0, 29.0, 36.0, 16.0, 12.0, 20.0, 17.0, 16.0, 9.0, 7.0, 8.0, 6.0, 3.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-176.2188262939453, -171.19631958007812, -166.17381286621094, -161.15130615234375, -156.12879943847656, -151.10629272460938, -146.0837860107422, -141.061279296875, -136.0387725830078, -131.01626586914062, -125.99375915527344, -120.97125244140625, -115.94874572753906, -110.92623901367188, -105.90373229980469, -100.8812255859375, -95.85871124267578, -90.8362045288086, -85.8136978149414, -80.79119110107422, -75.76868438720703, -70.74617767333984, -65.72366333007812, -60.7011604309082, -55.678653717041016, -50.65614700317383, -45.63364028930664, -40.61112976074219, -35.588623046875, -30.566118240356445, -25.543609619140625, -20.521102905273438, -15.49859619140625, -10.476089477539062, -5.453581809997559, -0.4310741424560547, 4.591432571411133, 9.61393928527832, 14.63644790649414, 19.658954620361328, 24.681461334228516, 29.703968048095703, 34.72647476196289, 39.748985290527344, 44.77149200439453, 49.79399871826172, 54.816505432128906, 59.839012145996094, 64.86151885986328, 69.88402557373047, 74.90653228759766, 79.92903900146484, 84.95154571533203, 89.97405242919922, 94.99656677246094, 100.01907348632812, 105.04158020019531, 110.0640869140625, 115.08659362792969, 120.10910034179688, 125.13160705566406, 130.15411376953125, 135.17662048339844, 140.19912719726562, 145.2216339111328]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 4.0, 15.0, 18.0, 28.0, 28.0, 46.0, 59.0, 81.0, 106.0, 170.0, 214.0, 322.0, 530.0, 711.0, 1206.0, 1961.0, 3306.0, 5875.0, 12223.0, 31335.0, 117355.0, 3529191.0, 389619.0, 60109.0, 19977.0, 8690.0, 4462.0, 2496.0, 1453.0, 957.0, 543.0, 381.0, 260.0, 173.0, 123.0, 67.0, 67.0, 39.0, 26.0, 17.0, 11.0, 6.0, 5.0, 2.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-45.15625, -43.73486328125, -42.3134765625, -40.89208984375, -39.470703125, -38.04931640625, -36.6279296875, -35.20654296875, -33.78515625, -32.36376953125, -30.9423828125, -29.52099609375, -28.099609375, -26.67822265625, -25.2568359375, -23.83544921875, -22.4140625, -20.99267578125, -19.5712890625, -18.14990234375, -16.728515625, -15.30712890625, -13.8857421875, -12.46435546875, -11.04296875, -9.62158203125, -8.2001953125, -6.77880859375, -5.357421875, -3.93603515625, -2.5146484375, -1.09326171875, 0.328125, 1.74951171875, 3.1708984375, 4.59228515625, 6.013671875, 7.43505859375, 8.8564453125, 10.27783203125, 11.69921875, 13.12060546875, 14.5419921875, 15.96337890625, 17.384765625, 18.80615234375, 20.2275390625, 21.64892578125, 23.0703125, 24.49169921875, 25.9130859375, 27.33447265625, 28.755859375, 30.17724609375, 31.5986328125, 33.02001953125, 34.44140625, 35.86279296875, 37.2841796875, 38.70556640625, 40.126953125, 41.54833984375, 42.9697265625, 44.39111328125, 45.8125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 2.0, 9.0, 4.0, 9.0, 5.0, 12.0, 25.0, 20.0, 29.0, 25.0, 23.0, 39.0, 36.0, 42.0, 66.0, 46.0, 40.0, 59.0, 41.0, 48.0, 45.0, 44.0, 44.0, 32.0, 32.0, 39.0, 35.0, 24.0, 29.0, 20.0, 13.0, 16.0, 10.0, 11.0, 6.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.94921875, -7.73040771484375, -7.5115966796875, -7.29278564453125, -7.073974609375, -6.85516357421875, -6.6363525390625, -6.41754150390625, -6.19873046875, -5.97991943359375, -5.7611083984375, -5.54229736328125, -5.323486328125, -5.10467529296875, -4.8858642578125, -4.66705322265625, -4.4482421875, -4.22943115234375, -4.0106201171875, -3.79180908203125, -3.572998046875, -3.35418701171875, -3.1353759765625, -2.91656494140625, -2.69775390625, -2.47894287109375, -2.2601318359375, -2.04132080078125, -1.822509765625, -1.60369873046875, -1.3848876953125, -1.16607666015625, -0.947265625, -0.72845458984375, -0.5096435546875, -0.29083251953125, -0.072021484375, 0.14678955078125, 0.3656005859375, 0.58441162109375, 0.80322265625, 1.02203369140625, 1.2408447265625, 1.45965576171875, 1.678466796875, 1.89727783203125, 2.1160888671875, 2.33489990234375, 2.5537109375, 2.77252197265625, 2.9913330078125, 3.21014404296875, 3.428955078125, 3.64776611328125, 3.8665771484375, 4.08538818359375, 4.30419921875, 4.52301025390625, 4.7418212890625, 4.96063232421875, 5.179443359375, 5.39825439453125, 5.6170654296875, 5.83587646484375, 6.0546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 14.0, 20.0, 17.0, 21.0, 30.0, 33.0, 37.0, 42.0, 45.0, 67.0, 69.0, 108.0, 148.0, 224.0, 339.0, 544.0, 1037.0, 2258.0, 5027.0, 15493.0, 74735.0, 2946855.0, 1061756.0, 62012.0, 13734.0, 4771.0, 2027.0, 1060.0, 559.0, 305.0, 231.0, 164.0, 104.0, 87.0, 55.0, 50.0, 41.0, 27.0, 25.0, 30.0, 17.0, 12.0, 11.0, 10.0, 7.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-71.875, -69.7578125, -67.640625, -65.5234375, -63.40625, -61.2890625, -59.171875, -57.0546875, -54.9375, -52.8203125, -50.703125, -48.5859375, -46.46875, -44.3515625, -42.234375, -40.1171875, -38.0, -35.8828125, -33.765625, -31.6484375, -29.53125, -27.4140625, -25.296875, -23.1796875, -21.0625, -18.9453125, -16.828125, -14.7109375, -12.59375, -10.4765625, -8.359375, -6.2421875, -4.125, -2.0078125, 0.109375, 2.2265625, 4.34375, 6.4609375, 8.578125, 10.6953125, 12.8125, 14.9296875, 17.046875, 19.1640625, 21.28125, 23.3984375, 25.515625, 27.6328125, 29.75, 31.8671875, 33.984375, 36.1015625, 38.21875, 40.3359375, 42.453125, 44.5703125, 46.6875, 48.8046875, 50.921875, 53.0390625, 55.15625, 57.2734375, 59.390625, 61.5078125, 63.625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 14.0, 5.0, 19.0, 62.0, 100.0, 195.0, 649.0, 2325.0, 380.0, 150.0, 63.0, 39.0, 23.0, 19.0, 9.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.34375, -43.184814453125, -42.02587890625, -40.866943359375, -39.7080078125, -38.549072265625, -37.39013671875, -36.231201171875, -35.072265625, -33.913330078125, -32.75439453125, -31.595458984375, -30.4365234375, -29.277587890625, -28.11865234375, -26.959716796875, -25.80078125, -24.641845703125, -23.48291015625, -22.323974609375, -21.1650390625, -20.006103515625, -18.84716796875, -17.688232421875, -16.529296875, -15.370361328125, -14.21142578125, -13.052490234375, -11.8935546875, -10.734619140625, -9.57568359375, -8.416748046875, -7.2578125, -6.098876953125, -4.93994140625, -3.781005859375, -2.6220703125, -1.463134765625, -0.30419921875, 0.854736328125, 2.013671875, 3.172607421875, 4.33154296875, 5.490478515625, 6.6494140625, 7.808349609375, 8.96728515625, 10.126220703125, 11.28515625, 12.444091796875, 13.60302734375, 14.761962890625, 15.9208984375, 17.079833984375, 18.23876953125, 19.397705078125, 20.556640625, 21.715576171875, 22.87451171875, 24.033447265625, 25.1923828125, 26.351318359375, 27.51025390625, 28.669189453125, 29.828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 14.0, 34.0, 70.0, 136.0, 209.0, 219.0, 156.0, 77.0, 37.0, 23.0, 15.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.14600372314453, -97.03350067138672, -88.9209976196289, -80.8084945678711, -72.69599151611328, -64.58348846435547, -56.470985412597656, -48.358482360839844, -40.24597930908203, -32.13347625732422, -24.020973205566406, -15.908470153808594, -7.795967102050781, 0.31653594970703125, 8.429039001464844, 16.541542053222656, 24.65404510498047, 32.76654815673828, 40.879051208496094, 48.991554260253906, 57.10405731201172, 65.21656036376953, 73.32906341552734, 81.44156646728516, 89.55406951904297, 97.66657257080078, 105.7790756225586, 113.8915786743164, 122.00408172607422, 130.1165771484375, 138.22909545898438, 146.34158325195312, 154.4541015625, 162.5666046142578, 170.67910766601562, 178.79161071777344, 186.90411376953125, 195.01661682128906, 203.12911987304688, 211.2416229248047, 219.3541259765625, 227.4666290283203, 235.57913208007812, 243.69163513183594, 251.80413818359375, 259.9166259765625, 268.0291442871094, 276.14166259765625, 284.254150390625, 292.36663818359375, 300.4791564941406, 308.5916748046875, 316.70416259765625, 324.816650390625, 332.9291687011719, 341.04168701171875, 349.1541748046875, 357.26666259765625, 365.3791809082031, 373.49169921875, 381.60418701171875, 389.7166748046875, 397.8291931152344, 405.94171142578125, 414.05419921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 3.0, 10.0, 7.0, 9.0, 11.0, 13.0, 18.0, 23.0, 29.0, 17.0, 30.0, 21.0, 33.0, 31.0, 32.0, 31.0, 42.0, 44.0, 38.0, 51.0, 40.0, 45.0, 33.0, 40.0, 40.0, 25.0, 25.0, 34.0, 24.0, 23.0, 21.0, 16.0, 18.0, 14.0, 15.0, 25.0, 10.0, 14.0, 5.0, 13.0, 7.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-72.34542083740234, -70.24555206298828, -68.14569091796875, -66.04582214355469, -63.94595718383789, -61.846092224121094, -59.74622344970703, -57.646358489990234, -55.54649353027344, -53.44662857055664, -51.346763610839844, -49.24689483642578, -47.147029876708984, -45.04716491699219, -42.947296142578125, -40.84743118286133, -38.74756622314453, -36.647701263427734, -34.54783630371094, -32.447967529296875, -30.348102569580078, -28.24823760986328, -26.14837074279785, -24.048503875732422, -21.948638916015625, -19.848773956298828, -17.7489070892334, -15.649041175842285, -13.549175262451172, -11.449309349060059, -9.349443435668945, -7.249577522277832, -5.149715423583984, -3.049849510192871, -0.9499835968017578, 1.1498823165893555, 3.2497482299804688, 5.349614143371582, 7.449480056762695, 9.549345970153809, 11.649211883544922, 13.749077796936035, 15.848943710327148, 17.948810577392578, 20.048675537109375, 22.148540496826172, 24.2484073638916, 26.34827423095703, 28.448139190673828, 30.548004150390625, 32.64787292480469, 34.747737884521484, 36.84760284423828, 38.94746780395508, 41.047332763671875, 43.14720153808594, 45.247066497802734, 47.34693145751953, 49.446800231933594, 51.54666519165039, 53.64653015136719, 55.746395111083984, 57.84626007080078, 59.946128845214844, 62.04599380493164]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 13.0, 13.0, 14.0, 38.0, 39.0, 57.0, 92.0, 141.0, 185.0, 389.0, 544.0, 919.0, 1722.0, 3140.0, 6254.0, 13382.0, 32580.0, 91712.0, 397513.0, 358154.0, 85201.0, 30840.0, 12652.0, 5942.0, 2985.0, 1615.0, 900.0, 539.0, 348.0, 222.0, 131.0, 73.0, 65.0, 36.0, 28.0, 23.0, 15.0, 14.0, 7.0, 8.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.78125, -40.43212890625, -39.0830078125, -37.73388671875, -36.384765625, -35.03564453125, -33.6865234375, -32.33740234375, -30.98828125, -29.63916015625, -28.2900390625, -26.94091796875, -25.591796875, -24.24267578125, -22.8935546875, -21.54443359375, -20.1953125, -18.84619140625, -17.4970703125, -16.14794921875, -14.798828125, -13.44970703125, -12.1005859375, -10.75146484375, -9.40234375, -8.05322265625, -6.7041015625, -5.35498046875, -4.005859375, -2.65673828125, -1.3076171875, 0.04150390625, 1.390625, 2.73974609375, 4.0888671875, 5.43798828125, 6.787109375, 8.13623046875, 9.4853515625, 10.83447265625, 12.18359375, 13.53271484375, 14.8818359375, 16.23095703125, 17.580078125, 18.92919921875, 20.2783203125, 21.62744140625, 22.9765625, 24.32568359375, 25.6748046875, 27.02392578125, 28.373046875, 29.72216796875, 31.0712890625, 32.42041015625, 33.76953125, 35.11865234375, 36.4677734375, 37.81689453125, 39.166015625, 40.51513671875, 41.8642578125, 43.21337890625, 44.5625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 5.0, 8.0, 10.0, 5.0, 13.0, 13.0, 26.0, 22.0, 28.0, 39.0, 36.0, 38.0, 44.0, 49.0, 40.0, 57.0, 46.0, 45.0, 47.0, 42.0, 41.0, 48.0, 40.0, 38.0, 28.0, 24.0, 32.0, 18.0, 28.0, 9.0, 16.0, 11.0, 13.0, 6.0, 11.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.5390625, -7.31964111328125, -7.1002197265625, -6.88079833984375, -6.661376953125, -6.44195556640625, -6.2225341796875, -6.00311279296875, -5.78369140625, -5.56427001953125, -5.3448486328125, -5.12542724609375, -4.906005859375, -4.68658447265625, -4.4671630859375, -4.24774169921875, -4.0283203125, -3.80889892578125, -3.5894775390625, -3.37005615234375, -3.150634765625, -2.93121337890625, -2.7117919921875, -2.49237060546875, -2.27294921875, -2.05352783203125, -1.8341064453125, -1.61468505859375, -1.395263671875, -1.17584228515625, -0.9564208984375, -0.73699951171875, -0.517578125, -0.29815673828125, -0.0787353515625, 0.14068603515625, 0.360107421875, 0.57952880859375, 0.7989501953125, 1.01837158203125, 1.23779296875, 1.45721435546875, 1.6766357421875, 1.89605712890625, 2.115478515625, 2.33489990234375, 2.5543212890625, 2.77374267578125, 2.9931640625, 3.21258544921875, 3.4320068359375, 3.65142822265625, 3.870849609375, 4.09027099609375, 4.3096923828125, 4.52911376953125, 4.74853515625, 4.96795654296875, 5.1873779296875, 5.40679931640625, 5.626220703125, 5.84564208984375, 6.0650634765625, 6.28448486328125, 6.50390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 6.0, 6.0, 15.0, 8.0, 27.0, 25.0, 47.0, 53.0, 80.0, 131.0, 220.0, 326.0, 483.0, 768.0, 1352.0, 2267.0, 4538.0, 10369.0, 30607.0, 123809.0, 600582.0, 201603.0, 44520.0, 13989.0, 5652.0, 2858.0, 1597.0, 952.0, 608.0, 328.0, 214.0, 142.0, 98.0, 75.0, 49.0, 29.0, 24.0, 25.0, 11.0, 8.0, 8.0, 7.0, 9.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-42.46875, -41.16796875, -39.8671875, -38.56640625, -37.265625, -35.96484375, -34.6640625, -33.36328125, -32.0625, -30.76171875, -29.4609375, -28.16015625, -26.859375, -25.55859375, -24.2578125, -22.95703125, -21.65625, -20.35546875, -19.0546875, -17.75390625, -16.453125, -15.15234375, -13.8515625, -12.55078125, -11.25, -9.94921875, -8.6484375, -7.34765625, -6.046875, -4.74609375, -3.4453125, -2.14453125, -0.84375, 0.45703125, 1.7578125, 3.05859375, 4.359375, 5.66015625, 6.9609375, 8.26171875, 9.5625, 10.86328125, 12.1640625, 13.46484375, 14.765625, 16.06640625, 17.3671875, 18.66796875, 19.96875, 21.26953125, 22.5703125, 23.87109375, 25.171875, 26.47265625, 27.7734375, 29.07421875, 30.375, 31.67578125, 32.9765625, 34.27734375, 35.578125, 36.87890625, 38.1796875, 39.48046875, 40.78125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 12.0, 12.0, 9.0, 22.0, 17.0, 28.0, 29.0, 52.0, 48.0, 45.0, 31.0, 72.0, 51.0, 69.0, 62.0, 60.0, 58.0, 42.0, 44.0, 52.0, 34.0, 36.0, 26.0, 19.0, 12.0, 10.0, 10.0, 8.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.515625, -30.291259765625, -29.06689453125, -27.842529296875, -26.6181640625, -25.393798828125, -24.16943359375, -22.945068359375, -21.720703125, -20.496337890625, -19.27197265625, -18.047607421875, -16.8232421875, -15.598876953125, -14.37451171875, -13.150146484375, -11.92578125, -10.701416015625, -9.47705078125, -8.252685546875, -7.0283203125, -5.803955078125, -4.57958984375, -3.355224609375, -2.130859375, -0.906494140625, 0.31787109375, 1.542236328125, 2.7666015625, 3.990966796875, 5.21533203125, 6.439697265625, 7.6640625, 8.888427734375, 10.11279296875, 11.337158203125, 12.5615234375, 13.785888671875, 15.01025390625, 16.234619140625, 17.458984375, 18.683349609375, 19.90771484375, 21.132080078125, 22.3564453125, 23.580810546875, 24.80517578125, 26.029541015625, 27.25390625, 28.478271484375, 29.70263671875, 30.927001953125, 32.1513671875, 33.375732421875, 34.60009765625, 35.824462890625, 37.048828125, 38.273193359375, 39.49755859375, 40.721923828125, 41.9462890625, 43.170654296875, 44.39501953125, 45.619384765625, 46.84375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 14.0, 13.0, 19.0, 23.0, 47.0, 48.0, 101.0, 114.0, 182.0, 330.0, 524.0, 978.0, 1976.0, 4405.0, 11937.0, 41592.0, 286570.0, 591956.0, 77240.0, 18320.0, 6445.0, 2655.0, 1274.0, 715.0, 393.0, 239.0, 126.0, 82.0, 63.0, 42.0, 38.0, 20.0, 18.0, 14.0, 5.0, 5.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.796875, -21.074951171875, -20.35302734375, -19.631103515625, -18.9091796875, -18.187255859375, -17.46533203125, -16.743408203125, -16.021484375, -15.299560546875, -14.57763671875, -13.855712890625, -13.1337890625, -12.411865234375, -11.68994140625, -10.968017578125, -10.24609375, -9.524169921875, -8.80224609375, -8.080322265625, -7.3583984375, -6.636474609375, -5.91455078125, -5.192626953125, -4.470703125, -3.748779296875, -3.02685546875, -2.304931640625, -1.5830078125, -0.861083984375, -0.13916015625, 0.582763671875, 1.3046875, 2.026611328125, 2.74853515625, 3.470458984375, 4.1923828125, 4.914306640625, 5.63623046875, 6.358154296875, 7.080078125, 7.802001953125, 8.52392578125, 9.245849609375, 9.9677734375, 10.689697265625, 11.41162109375, 12.133544921875, 12.85546875, 13.577392578125, 14.29931640625, 15.021240234375, 15.7431640625, 16.465087890625, 17.18701171875, 17.908935546875, 18.630859375, 19.352783203125, 20.07470703125, 20.796630859375, 21.5185546875, 22.240478515625, 22.96240234375, 23.684326171875, 24.40625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 18.0, 19.0, 64.0, 180.0, 400.0, 180.0, 60.0, 26.0, 17.0, 7.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.018890380859375, -0.01849287748336792, -0.01809537410736084, -0.01769787073135376, -0.01730036735534668, -0.0169028639793396, -0.01650536060333252, -0.01610785722732544, -0.01571035385131836, -0.01531285047531128, -0.0149153470993042, -0.01451784372329712, -0.014120340347290039, -0.013722836971282959, -0.013325333595275879, -0.012927830219268799, -0.012530326843261719, -0.012132823467254639, -0.011735320091247559, -0.011337816715240479, -0.010940313339233398, -0.010542809963226318, -0.010145306587219238, -0.009747803211212158, -0.009350299835205078, -0.008952796459197998, -0.008555293083190918, -0.008157789707183838, -0.007760286331176758, -0.007362782955169678, -0.006965279579162598, -0.006567776203155518, -0.0061702728271484375, -0.005772769451141357, -0.005375266075134277, -0.004977762699127197, -0.004580259323120117, -0.004182755947113037, -0.003785252571105957, -0.003387749195098877, -0.002990245819091797, -0.002592742443084717, -0.0021952390670776367, -0.0017977356910705566, -0.0014002323150634766, -0.0010027289390563965, -0.0006052255630493164, -0.00020772218704223633, 0.00018978118896484375, 0.0005872845649719238, 0.000984787940979004, 0.001382291316986084, 0.001779794692993164, 0.002177298069000244, 0.0025748014450073242, 0.0029723048210144043, 0.0033698081970214844, 0.0037673115730285645, 0.0041648149490356445, 0.004562318325042725, 0.004959821701049805, 0.005357325077056885, 0.005754828453063965, 0.006152331829071045, 0.006549835205078125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 11.0, 20.0, 30.0, 32.0, 63.0, 72.0, 134.0, 242.0, 374.0, 670.0, 1150.0, 2310.0, 5140.0, 13539.0, 44681.0, 276872.0, 581807.0, 85428.0, 21361.0, 7818.0, 3175.0, 1603.0, 806.0, 471.0, 266.0, 146.0, 110.0, 76.0, 32.0, 24.0, 26.0, 19.0, 11.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.5615234375, -17.966796875, -17.3720703125, -16.77734375, -16.1826171875, -15.587890625, -14.9931640625, -14.3984375, -13.8037109375, -13.208984375, -12.6142578125, -12.01953125, -11.4248046875, -10.830078125, -10.2353515625, -9.640625, -9.0458984375, -8.451171875, -7.8564453125, -7.26171875, -6.6669921875, -6.072265625, -5.4775390625, -4.8828125, -4.2880859375, -3.693359375, -3.0986328125, -2.50390625, -1.9091796875, -1.314453125, -0.7197265625, -0.125, 0.4697265625, 1.064453125, 1.6591796875, 2.25390625, 2.8486328125, 3.443359375, 4.0380859375, 4.6328125, 5.2275390625, 5.822265625, 6.4169921875, 7.01171875, 7.6064453125, 8.201171875, 8.7958984375, 9.390625, 9.9853515625, 10.580078125, 11.1748046875, 11.76953125, 12.3642578125, 12.958984375, 13.5537109375, 14.1484375, 14.7431640625, 15.337890625, 15.9326171875, 16.52734375, 17.1220703125, 17.716796875, 18.3115234375, 18.90625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 12.0, 5.0, 16.0, 19.0, 35.0, 55.0, 62.0, 92.0, 119.0, 108.0, 106.0, 87.0, 79.0, 53.0, 29.0, 19.0, 14.0, 12.0, 13.0, 6.0, 4.0, 10.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-18.21875, -17.7586669921875, -17.298583984375, -16.8385009765625, -16.37841796875, -15.9183349609375, -15.458251953125, -14.9981689453125, -14.5380859375, -14.0780029296875, -13.617919921875, -13.1578369140625, -12.69775390625, -12.2376708984375, -11.777587890625, -11.3175048828125, -10.857421875, -10.3973388671875, -9.937255859375, -9.4771728515625, -9.01708984375, -8.5570068359375, -8.096923828125, -7.6368408203125, -7.1767578125, -6.7166748046875, -6.256591796875, -5.7965087890625, -5.33642578125, -4.8763427734375, -4.416259765625, -3.9561767578125, -3.49609375, -3.0360107421875, -2.575927734375, -2.1158447265625, -1.65576171875, -1.1956787109375, -0.735595703125, -0.2755126953125, 0.1845703125, 0.6446533203125, 1.104736328125, 1.5648193359375, 2.02490234375, 2.4849853515625, 2.945068359375, 3.4051513671875, 3.865234375, 4.3253173828125, 4.785400390625, 5.2454833984375, 5.70556640625, 6.1656494140625, 6.625732421875, 7.0858154296875, 7.5458984375, 8.0059814453125, 8.466064453125, 8.9261474609375, 9.38623046875, 9.8463134765625, 10.306396484375, 10.7664794921875, 11.2265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 3.0, 16.0, 25.0, 46.0, 65.0, 113.0, 128.0, 141.0, 135.0, 114.0, 72.0, 66.0, 23.0, 25.0, 13.0, 10.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.1841735839844, -294.5325622558594, -284.8809814453125, -275.2293701171875, -265.5777587890625, -255.92616271972656, -246.27456665039062, -236.62295532226562, -226.9713592529297, -217.31976318359375, -207.66815185546875, -198.0165557861328, -188.36495971679688, -178.71334838867188, -169.06175231933594, -159.41015625, -149.758544921875, -140.10694885253906, -130.45533752441406, -120.80374145507812, -111.15213775634766, -101.50053405761719, -91.84893798828125, -82.19733428955078, -72.54573059082031, -62.894126892089844, -53.24252700805664, -43.59092712402344, -33.93932342529297, -24.2877197265625, -14.636119842529297, -4.984519958496094, 4.667083740234375, 14.318685531616211, 23.970287322998047, 33.62188720703125, 43.27349090576172, 52.92509460449219, 62.57669448852539, 72.2282943725586, 81.87989807128906, 91.53150177001953, 101.18310546875, 110.83470153808594, 120.4863052368164, 130.13790893554688, 139.7895050048828, 149.44110107421875, 159.09271240234375, 168.7443084716797, 178.3959197998047, 188.04751586914062, 197.69912719726562, 207.35072326660156, 217.0023193359375, 226.6539306640625, 236.30552673339844, 245.95712280273438, 255.60873413085938, 265.2603454589844, 274.91192626953125, 284.56353759765625, 294.21514892578125, 303.8667297363281, 313.5183410644531]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 4.0, 10.0, 8.0, 5.0, 13.0, 17.0, 19.0, 18.0, 35.0, 16.0, 22.0, 35.0, 33.0, 49.0, 43.0, 34.0, 42.0, 41.0, 51.0, 40.0, 41.0, 41.0, 40.0, 42.0, 42.0, 34.0, 26.0, 34.0, 26.0, 22.0, 15.0, 17.0, 12.0, 9.0, 9.0, 12.0, 8.0, 9.0, 8.0, 3.0, 1.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-171.1358642578125, -166.36476135253906, -161.59365844726562, -156.8225555419922, -152.05145263671875, -147.28036499023438, -142.50926208496094, -137.7381591796875, -132.96705627441406, -128.19595336914062, -123.42485046386719, -118.65375518798828, -113.88265228271484, -109.1115493774414, -104.3404541015625, -99.56935119628906, -94.79824829101562, -90.02714538574219, -85.25604248046875, -80.48494720458984, -75.7138442993164, -70.94274139404297, -66.17164611816406, -61.400543212890625, -56.62944030761719, -51.85833740234375, -47.08723831176758, -42.316139221191406, -37.54503631591797, -32.77393341064453, -28.00283432006836, -23.231735229492188, -18.460617065429688, -13.689516067504883, -8.918415069580078, -4.147314071655273, 0.6237869262695312, 5.394887924194336, 10.16598892211914, 14.937088012695312, 19.70819091796875, 24.479291915893555, 29.25039291381836, 34.02149200439453, 38.79259490966797, 43.563697814941406, 48.33479690551758, 53.10589599609375, 57.87699890136719, 62.648101806640625, 67.41920471191406, 72.19029998779297, 76.9614028930664, 81.73250579833984, 86.50360107421875, 91.27470397949219, 96.04580688476562, 100.81690979003906, 105.5880126953125, 110.3591079711914, 115.13021087646484, 119.90131378173828, 124.67240905761719, 129.44351196289062, 134.21461486816406]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 2.0, 6.0, 6.0, 17.0, 15.0, 34.0, 36.0, 52.0, 81.0, 103.0, 154.0, 253.0, 404.0, 669.0, 1215.0, 2237.0, 4708.0, 10735.0, 32251.0, 236190.0, 3794677.0, 77477.0, 18548.0, 7120.0, 3282.0, 1661.0, 873.0, 549.0, 342.0, 218.0, 125.0, 86.0, 39.0, 38.0, 26.0, 20.0, 13.0, 4.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.25, -74.2041015625, -72.158203125, -70.1123046875, -68.06640625, -66.0205078125, -63.974609375, -61.9287109375, -59.8828125, -57.8369140625, -55.791015625, -53.7451171875, -51.69921875, -49.6533203125, -47.607421875, -45.5615234375, -43.515625, -41.4697265625, -39.423828125, -37.3779296875, -35.33203125, -33.2861328125, -31.240234375, -29.1943359375, -27.1484375, -25.1025390625, -23.056640625, -21.0107421875, -18.96484375, -16.9189453125, -14.873046875, -12.8271484375, -10.78125, -8.7353515625, -6.689453125, -4.6435546875, -2.59765625, -0.5517578125, 1.494140625, 3.5400390625, 5.5859375, 7.6318359375, 9.677734375, 11.7236328125, 13.76953125, 15.8154296875, 17.861328125, 19.9072265625, 21.953125, 23.9990234375, 26.044921875, 28.0908203125, 30.13671875, 32.1826171875, 34.228515625, 36.2744140625, 38.3203125, 40.3662109375, 42.412109375, 44.4580078125, 46.50390625, 48.5498046875, 50.595703125, 52.6416015625, 54.6875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 14.0, 15.0, 8.0, 17.0, 15.0, 20.0, 34.0, 39.0, 42.0, 46.0, 44.0, 57.0, 58.0, 36.0, 51.0, 45.0, 42.0, 52.0, 44.0, 55.0, 46.0, 33.0, 37.0, 29.0, 23.0, 14.0, 24.0, 11.0, 7.0, 6.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.0523681640625, -7.792236328125, -7.5321044921875, -7.27197265625, -7.0118408203125, -6.751708984375, -6.4915771484375, -6.2314453125, -5.9713134765625, -5.711181640625, -5.4510498046875, -5.19091796875, -4.9307861328125, -4.670654296875, -4.4105224609375, -4.150390625, -3.8902587890625, -3.630126953125, -3.3699951171875, -3.10986328125, -2.8497314453125, -2.589599609375, -2.3294677734375, -2.0693359375, -1.8092041015625, -1.549072265625, -1.2889404296875, -1.02880859375, -0.7686767578125, -0.508544921875, -0.2484130859375, 0.01171875, 0.2718505859375, 0.531982421875, 0.7921142578125, 1.05224609375, 1.3123779296875, 1.572509765625, 1.8326416015625, 2.0927734375, 2.3529052734375, 2.613037109375, 2.8731689453125, 3.13330078125, 3.3934326171875, 3.653564453125, 3.9136962890625, 4.173828125, 4.4339599609375, 4.694091796875, 4.9542236328125, 5.21435546875, 5.4744873046875, 5.734619140625, 5.9947509765625, 6.2548828125, 6.5150146484375, 6.775146484375, 7.0352783203125, 7.29541015625, 7.5555419921875, 7.815673828125, 8.0758056640625, 8.3359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 11.0, 16.0, 18.0, 22.0, 21.0, 45.0, 53.0, 76.0, 140.0, 200.0, 342.0, 569.0, 1052.0, 2346.0, 6104.0, 20481.0, 143394.0, 3863223.0, 125591.0, 19523.0, 6054.0, 2356.0, 1124.0, 582.0, 323.0, 181.0, 146.0, 78.0, 52.0, 33.0, 22.0, 18.0, 14.0, 15.0, 7.0, 5.0, 5.0, 7.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-91.8125, -89.1494140625, -86.486328125, -83.8232421875, -81.16015625, -78.4970703125, -75.833984375, -73.1708984375, -70.5078125, -67.8447265625, -65.181640625, -62.5185546875, -59.85546875, -57.1923828125, -54.529296875, -51.8662109375, -49.203125, -46.5400390625, -43.876953125, -41.2138671875, -38.55078125, -35.8876953125, -33.224609375, -30.5615234375, -27.8984375, -25.2353515625, -22.572265625, -19.9091796875, -17.24609375, -14.5830078125, -11.919921875, -9.2568359375, -6.59375, -3.9306640625, -1.267578125, 1.3955078125, 4.05859375, 6.7216796875, 9.384765625, 12.0478515625, 14.7109375, 17.3740234375, 20.037109375, 22.7001953125, 25.36328125, 28.0263671875, 30.689453125, 33.3525390625, 36.015625, 38.6787109375, 41.341796875, 44.0048828125, 46.66796875, 49.3310546875, 51.994140625, 54.6572265625, 57.3203125, 59.9833984375, 62.646484375, 65.3095703125, 67.97265625, 70.6357421875, 73.298828125, 75.9619140625, 78.625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 17.0, 30.0, 33.0, 92.0, 223.0, 988.0, 2253.0, 228.0, 84.0, 33.0, 25.0, 14.0, 12.0, 11.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.1875, -48.994140625, -47.80078125, -46.607421875, -45.4140625, -44.220703125, -43.02734375, -41.833984375, -40.640625, -39.447265625, -38.25390625, -37.060546875, -35.8671875, -34.673828125, -33.48046875, -32.287109375, -31.09375, -29.900390625, -28.70703125, -27.513671875, -26.3203125, -25.126953125, -23.93359375, -22.740234375, -21.546875, -20.353515625, -19.16015625, -17.966796875, -16.7734375, -15.580078125, -14.38671875, -13.193359375, -12.0, -10.806640625, -9.61328125, -8.419921875, -7.2265625, -6.033203125, -4.83984375, -3.646484375, -2.453125, -1.259765625, -0.06640625, 1.126953125, 2.3203125, 3.513671875, 4.70703125, 5.900390625, 7.09375, 8.287109375, 9.48046875, 10.673828125, 11.8671875, 13.060546875, 14.25390625, 15.447265625, 16.640625, 17.833984375, 19.02734375, 20.220703125, 21.4140625, 22.607421875, 23.80078125, 24.994140625, 26.1875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 17.0, 36.0, 105.0, 272.0, 328.0, 171.0, 46.0, 15.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-497.5877380371094, -486.80401611328125, -476.0202941894531, -465.236572265625, -454.4528503417969, -443.66912841796875, -432.88543701171875, -422.1017150878906, -411.3179931640625, -400.5342712402344, -389.75054931640625, -378.9668273925781, -368.18310546875, -357.3994140625, -346.61566162109375, -335.83197021484375, -325.0482177734375, -314.2644958496094, -303.48077392578125, -292.6970520019531, -281.913330078125, -271.129638671875, -260.34588623046875, -249.56219482421875, -238.77847290039062, -227.9947509765625, -217.21102905273438, -206.42730712890625, -195.6436004638672, -184.85987854003906, -174.07615661621094, -163.29244995117188, -152.5087432861328, -141.7250213623047, -130.94129943847656, -120.15758514404297, -109.37387084960938, -98.59014892578125, -87.80642700195312, -77.02271270751953, -66.2389907836914, -55.45527267456055, -44.67155456542969, -33.88783264160156, -23.104114532470703, -12.320396423339844, -1.5366744995117188, 9.247039794921875, 20.03076171875, 30.81447982788086, 41.59819793701172, 52.381919860839844, 63.1656379699707, 73.94935607910156, 84.73307800292969, 95.51679229736328, 106.3005142211914, 117.08423614501953, 127.86795043945312, 138.65167236328125, 149.43539428710938, 160.2191162109375, 171.00283813476562, 181.7865447998047, 192.5702667236328]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 7.0, 6.0, 7.0, 13.0, 21.0, 9.0, 19.0, 22.0, 30.0, 34.0, 40.0, 40.0, 40.0, 49.0, 54.0, 50.0, 54.0, 49.0, 46.0, 46.0, 42.0, 47.0, 43.0, 39.0, 31.0, 23.0, 26.0, 24.0, 20.0, 9.0, 7.0, 12.0, 11.0, 6.0, 5.0, 7.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.95223999023438, -70.51971435546875, -68.0871810913086, -65.65465545654297, -63.22212600708008, -60.78959655761719, -58.35707092285156, -55.92454147338867, -53.49201202392578, -51.05948257446289, -48.626953125, -46.194427490234375, -43.761898040771484, -41.329368591308594, -38.89684295654297, -36.46431350708008, -34.03178405761719, -31.599254608154297, -29.16672706604004, -26.73419952392578, -24.30167007446289, -21.869140625, -19.436613082885742, -17.004085540771484, -14.571556091308594, -12.13902759552002, -9.706499099731445, -7.273970603942871, -4.841442108154297, -2.4089136123657227, 0.023614883422851562, 2.4561424255371094, 4.888671875, 7.321200370788574, 9.753728866577148, 12.186257362365723, 14.618785858154297, 17.051315307617188, 19.483842849731445, 21.916370391845703, 24.348899841308594, 26.781429290771484, 29.213956832885742, 31.646484375, 34.07901382446289, 36.51154327392578, 38.944068908691406, 41.3765983581543, 43.80912780761719, 46.24165725708008, 48.67418670654297, 51.106712341308594, 53.539241790771484, 55.971771240234375, 58.404296875, 60.83682632446289, 63.26935577392578, 65.7018814086914, 68.13441467285156, 70.56694030761719, 72.99946594238281, 75.43199920654297, 77.8645248413086, 80.29705810546875, 82.72958374023438]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 0.0, 1.0, 10.0, 12.0, 19.0, 15.0, 22.0, 49.0, 55.0, 91.0, 116.0, 187.0, 273.0, 346.0, 558.0, 885.0, 1421.0, 2339.0, 3864.0, 6781.0, 13252.0, 26668.0, 57851.0, 145256.0, 408541.0, 224001.0, 81783.0, 35703.0, 17219.0, 8670.0, 4855.0, 2850.0, 1689.0, 1037.0, 685.0, 437.0, 310.0, 192.0, 131.0, 108.0, 79.0, 46.0, 42.0, 36.0, 29.0, 13.0, 6.0, 10.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-27.3125, -26.501953125, -25.69140625, -24.880859375, -24.0703125, -23.259765625, -22.44921875, -21.638671875, -20.828125, -20.017578125, -19.20703125, -18.396484375, -17.5859375, -16.775390625, -15.96484375, -15.154296875, -14.34375, -13.533203125, -12.72265625, -11.912109375, -11.1015625, -10.291015625, -9.48046875, -8.669921875, -7.859375, -7.048828125, -6.23828125, -5.427734375, -4.6171875, -3.806640625, -2.99609375, -2.185546875, -1.375, -0.564453125, 0.24609375, 1.056640625, 1.8671875, 2.677734375, 3.48828125, 4.298828125, 5.109375, 5.919921875, 6.73046875, 7.541015625, 8.3515625, 9.162109375, 9.97265625, 10.783203125, 11.59375, 12.404296875, 13.21484375, 14.025390625, 14.8359375, 15.646484375, 16.45703125, 17.267578125, 18.078125, 18.888671875, 19.69921875, 20.509765625, 21.3203125, 22.130859375, 22.94140625, 23.751953125, 24.5625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 8.0, 6.0, 9.0, 6.0, 12.0, 12.0, 18.0, 24.0, 14.0, 25.0, 34.0, 25.0, 39.0, 33.0, 39.0, 31.0, 25.0, 36.0, 47.0, 37.0, 43.0, 46.0, 42.0, 43.0, 40.0, 29.0, 33.0, 30.0, 30.0, 23.0, 25.0, 24.0, 19.0, 12.0, 8.0, 14.0, 9.0, 5.0, 9.0, 6.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-7.71875, -7.4967041015625, -7.274658203125, -7.0526123046875, -6.83056640625, -6.6085205078125, -6.386474609375, -6.1644287109375, -5.9423828125, -5.7203369140625, -5.498291015625, -5.2762451171875, -5.05419921875, -4.8321533203125, -4.610107421875, -4.3880615234375, -4.166015625, -3.9439697265625, -3.721923828125, -3.4998779296875, -3.27783203125, -3.0557861328125, -2.833740234375, -2.6116943359375, -2.3896484375, -2.1676025390625, -1.945556640625, -1.7235107421875, -1.50146484375, -1.2794189453125, -1.057373046875, -0.8353271484375, -0.61328125, -0.3912353515625, -0.169189453125, 0.0528564453125, 0.27490234375, 0.4969482421875, 0.718994140625, 0.9410400390625, 1.1630859375, 1.3851318359375, 1.607177734375, 1.8292236328125, 2.05126953125, 2.2733154296875, 2.495361328125, 2.7174072265625, 2.939453125, 3.1614990234375, 3.383544921875, 3.6055908203125, 3.82763671875, 4.0496826171875, 4.271728515625, 4.4937744140625, 4.7158203125, 4.9378662109375, 5.159912109375, 5.3819580078125, 5.60400390625, 5.8260498046875, 6.048095703125, 6.2701416015625, 6.4921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 17.0, 19.0, 27.0, 35.0, 53.0, 76.0, 126.0, 191.0, 293.0, 533.0, 895.0, 1561.0, 2923.0, 6259.0, 15001.0, 41950.0, 175214.0, 624114.0, 122420.0, 33123.0, 12354.0, 5306.0, 2652.0, 1330.0, 740.0, 480.0, 289.0, 167.0, 128.0, 69.0, 54.0, 34.0, 21.0, 15.0, 18.0, 12.0, 13.0, 4.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-43.71875, -42.40966796875, -41.1005859375, -39.79150390625, -38.482421875, -37.17333984375, -35.8642578125, -34.55517578125, -33.24609375, -31.93701171875, -30.6279296875, -29.31884765625, -28.009765625, -26.70068359375, -25.3916015625, -24.08251953125, -22.7734375, -21.46435546875, -20.1552734375, -18.84619140625, -17.537109375, -16.22802734375, -14.9189453125, -13.60986328125, -12.30078125, -10.99169921875, -9.6826171875, -8.37353515625, -7.064453125, -5.75537109375, -4.4462890625, -3.13720703125, -1.828125, -0.51904296875, 0.7900390625, 2.09912109375, 3.408203125, 4.71728515625, 6.0263671875, 7.33544921875, 8.64453125, 9.95361328125, 11.2626953125, 12.57177734375, 13.880859375, 15.18994140625, 16.4990234375, 17.80810546875, 19.1171875, 20.42626953125, 21.7353515625, 23.04443359375, 24.353515625, 25.66259765625, 26.9716796875, 28.28076171875, 29.58984375, 30.89892578125, 32.2080078125, 33.51708984375, 34.826171875, 36.13525390625, 37.4443359375, 38.75341796875, 40.0625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 4.0, 9.0, 10.0, 19.0, 19.0, 31.0, 32.0, 40.0, 55.0, 53.0, 55.0, 59.0, 67.0, 74.0, 63.0, 64.0, 61.0, 42.0, 47.0, 33.0, 26.0, 29.0, 22.0, 19.0, 11.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.46875, -48.88427734375, -47.2998046875, -45.71533203125, -44.130859375, -42.54638671875, -40.9619140625, -39.37744140625, -37.79296875, -36.20849609375, -34.6240234375, -33.03955078125, -31.455078125, -29.87060546875, -28.2861328125, -26.70166015625, -25.1171875, -23.53271484375, -21.9482421875, -20.36376953125, -18.779296875, -17.19482421875, -15.6103515625, -14.02587890625, -12.44140625, -10.85693359375, -9.2724609375, -7.68798828125, -6.103515625, -4.51904296875, -2.9345703125, -1.35009765625, 0.234375, 1.81884765625, 3.4033203125, 4.98779296875, 6.572265625, 8.15673828125, 9.7412109375, 11.32568359375, 12.91015625, 14.49462890625, 16.0791015625, 17.66357421875, 19.248046875, 20.83251953125, 22.4169921875, 24.00146484375, 25.5859375, 27.17041015625, 28.7548828125, 30.33935546875, 31.923828125, 33.50830078125, 35.0927734375, 36.67724609375, 38.26171875, 39.84619140625, 41.4306640625, 43.01513671875, 44.599609375, 46.18408203125, 47.7685546875, 49.35302734375, 50.9375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 17.0, 21.0, 33.0, 35.0, 37.0, 65.0, 82.0, 155.0, 231.0, 393.0, 631.0, 1192.0, 2055.0, 4010.0, 8994.0, 24223.0, 95114.0, 565868.0, 269306.0, 48105.0, 14957.0, 6213.0, 2909.0, 1560.0, 849.0, 531.0, 295.0, 202.0, 147.0, 88.0, 51.0, 47.0, 30.0, 18.0, 9.0, 13.0, 12.0, 6.0, 10.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.171875, -18.604248046875, -18.03662109375, -17.468994140625, -16.9013671875, -16.333740234375, -15.76611328125, -15.198486328125, -14.630859375, -14.063232421875, -13.49560546875, -12.927978515625, -12.3603515625, -11.792724609375, -11.22509765625, -10.657470703125, -10.08984375, -9.522216796875, -8.95458984375, -8.386962890625, -7.8193359375, -7.251708984375, -6.68408203125, -6.116455078125, -5.548828125, -4.981201171875, -4.41357421875, -3.845947265625, -3.2783203125, -2.710693359375, -2.14306640625, -1.575439453125, -1.0078125, -0.440185546875, 0.12744140625, 0.695068359375, 1.2626953125, 1.830322265625, 2.39794921875, 2.965576171875, 3.533203125, 4.100830078125, 4.66845703125, 5.236083984375, 5.8037109375, 6.371337890625, 6.93896484375, 7.506591796875, 8.07421875, 8.641845703125, 9.20947265625, 9.777099609375, 10.3447265625, 10.912353515625, 11.47998046875, 12.047607421875, 12.615234375, 13.182861328125, 13.75048828125, 14.318115234375, 14.8857421875, 15.453369140625, 16.02099609375, 16.588623046875, 17.15625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 13.0, 14.0, 15.0, 40.0, 81.0, 342.0, 316.0, 81.0, 27.0, 25.0, 16.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01345062255859375, -0.013065934181213379, -0.012681245803833008, -0.012296557426452637, -0.011911869049072266, -0.011527180671691895, -0.011142492294311523, -0.010757803916931152, -0.010373115539550781, -0.00998842716217041, -0.009603738784790039, -0.009219050407409668, -0.008834362030029297, -0.008449673652648926, -0.008064985275268555, -0.007680296897888184, -0.0072956085205078125, -0.006910920143127441, -0.00652623176574707, -0.006141543388366699, -0.005756855010986328, -0.005372166633605957, -0.004987478256225586, -0.004602789878845215, -0.004218101501464844, -0.0038334131240844727, -0.0034487247467041016, -0.0030640363693237305, -0.0026793479919433594, -0.0022946596145629883, -0.0019099712371826172, -0.001525282859802246, -0.001140594482421875, -0.0007559061050415039, -0.0003712177276611328, 1.3470649719238281e-05, 0.0003981590270996094, 0.0007828474044799805, 0.0011675357818603516, 0.0015522241592407227, 0.0019369125366210938, 0.002321600914001465, 0.002706289291381836, 0.003090977668762207, 0.003475666046142578, 0.0038603544235229492, 0.00424504280090332, 0.004629731178283691, 0.0050144195556640625, 0.005399107933044434, 0.005783796310424805, 0.006168484687805176, 0.006553173065185547, 0.006937861442565918, 0.007322549819946289, 0.00770723819732666, 0.008091926574707031, 0.008476614952087402, 0.008861303329467773, 0.009245991706848145, 0.009630680084228516, 0.010015368461608887, 0.010400056838989258, 0.010784745216369629, 0.01116943359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 12.0, 20.0, 35.0, 53.0, 54.0, 109.0, 163.0, 319.0, 557.0, 1103.0, 2364.0, 6106.0, 19826.0, 98932.0, 732409.0, 148827.0, 24762.0, 7344.0, 2849.0, 1210.0, 640.0, 338.0, 205.0, 107.0, 58.0, 43.0, 31.0, 16.0, 10.0, 15.0, 9.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.28125, -26.53564453125, -25.7900390625, -25.04443359375, -24.298828125, -23.55322265625, -22.8076171875, -22.06201171875, -21.31640625, -20.57080078125, -19.8251953125, -19.07958984375, -18.333984375, -17.58837890625, -16.8427734375, -16.09716796875, -15.3515625, -14.60595703125, -13.8603515625, -13.11474609375, -12.369140625, -11.62353515625, -10.8779296875, -10.13232421875, -9.38671875, -8.64111328125, -7.8955078125, -7.14990234375, -6.404296875, -5.65869140625, -4.9130859375, -4.16748046875, -3.421875, -2.67626953125, -1.9306640625, -1.18505859375, -0.439453125, 0.30615234375, 1.0517578125, 1.79736328125, 2.54296875, 3.28857421875, 4.0341796875, 4.77978515625, 5.525390625, 6.27099609375, 7.0166015625, 7.76220703125, 8.5078125, 9.25341796875, 9.9990234375, 10.74462890625, 11.490234375, 12.23583984375, 12.9814453125, 13.72705078125, 14.47265625, 15.21826171875, 15.9638671875, 16.70947265625, 17.455078125, 18.20068359375, 18.9462890625, 19.69189453125, 20.4375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 4.0, 6.0, 11.0, 9.0, 11.0, 13.0, 37.0, 52.0, 69.0, 82.0, 133.0, 130.0, 119.0, 94.0, 63.0, 44.0, 32.0, 20.0, 13.0, 12.0, 5.0, 10.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.796875, -18.202392578125, -17.60791015625, -17.013427734375, -16.4189453125, -15.824462890625, -15.22998046875, -14.635498046875, -14.041015625, -13.446533203125, -12.85205078125, -12.257568359375, -11.6630859375, -11.068603515625, -10.47412109375, -9.879638671875, -9.28515625, -8.690673828125, -8.09619140625, -7.501708984375, -6.9072265625, -6.312744140625, -5.71826171875, -5.123779296875, -4.529296875, -3.934814453125, -3.34033203125, -2.745849609375, -2.1513671875, -1.556884765625, -0.96240234375, -0.367919921875, 0.2265625, 0.821044921875, 1.41552734375, 2.010009765625, 2.6044921875, 3.198974609375, 3.79345703125, 4.387939453125, 4.982421875, 5.576904296875, 6.17138671875, 6.765869140625, 7.3603515625, 7.954833984375, 8.54931640625, 9.143798828125, 9.73828125, 10.332763671875, 10.92724609375, 11.521728515625, 12.1162109375, 12.710693359375, 13.30517578125, 13.899658203125, 14.494140625, 15.088623046875, 15.68310546875, 16.277587890625, 16.8720703125, 17.466552734375, 18.06103515625, 18.655517578125, 19.25]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 9.0, 23.0, 67.0, 177.0, 331.0, 236.0, 110.0, 47.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.3223876953125, -163.19183349609375, -142.061279296875, -120.93071746826172, -99.80016326904297, -78.66960906982422, -57.53904724121094, -36.40849304199219, -15.277938842773438, 5.852617263793945, 26.983173370361328, 48.113731384277344, 69.2442855834961, 90.37483978271484, 111.50540161132812, 132.63595581054688, 153.76651000976562, 174.89706420898438, 196.02761840820312, 217.15817260742188, 238.28872680664062, 259.4192810058594, 280.54986572265625, 301.680419921875, 322.81097412109375, 343.9415283203125, 365.07208251953125, 386.20263671875, 407.33319091796875, 428.4637451171875, 449.59429931640625, 470.724853515625, 491.85540771484375, 512.9859619140625, 534.1165161132812, 555.2470703125, 576.3776245117188, 597.5081787109375, 618.6387329101562, 639.769287109375, 660.8998413085938, 682.0303955078125, 703.1609497070312, 724.29150390625, 745.4220581054688, 766.5526123046875, 787.6831665039062, 808.813720703125, 829.9443359375, 851.0748901367188, 872.2054443359375, 893.3359985351562, 914.466552734375, 935.5971069335938, 956.7276611328125, 977.8582153320312, 998.98876953125, 1020.1193237304688, 1041.2498779296875, 1062.3804931640625, 1083.510986328125, 1104.6416015625, 1125.7720947265625, 1146.9027099609375, 1168.033203125]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 9.0, 3.0, 8.0, 6.0, 7.0, 7.0, 10.0, 18.0, 13.0, 14.0, 19.0, 21.0, 25.0, 24.0, 24.0, 25.0, 34.0, 39.0, 38.0, 29.0, 38.0, 37.0, 42.0, 36.0, 48.0, 44.0, 36.0, 34.0, 38.0, 38.0, 31.0, 28.0, 19.0, 21.0, 20.0, 22.0, 16.0, 13.0, 15.0, 5.0, 10.0, 10.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-159.8803253173828, -154.90208435058594, -149.92385864257812, -144.94561767578125, -139.96737670898438, -134.9891357421875, -130.01089477539062, -125.03266906738281, -120.05442810058594, -115.07618713378906, -110.09795379638672, -105.11972045898438, -100.1414794921875, -95.16323852539062, -90.18500518798828, -85.20677185058594, -80.22853088378906, -75.25028991699219, -70.27205657958984, -65.2938232421875, -60.315582275390625, -55.337345123291016, -50.359107971191406, -45.3808708190918, -40.40263366699219, -35.42439651489258, -30.44615936279297, -25.46792221069336, -20.48968505859375, -15.51144790649414, -10.533210754394531, -5.554973602294922, -0.57672119140625, 4.401515960693359, 9.379753112792969, 14.357990264892578, 19.336227416992188, 24.314464569091797, 29.292701721191406, 34.270938873291016, 39.249176025390625, 44.227413177490234, 49.205650329589844, 54.18388748168945, 59.16212463378906, 64.14036560058594, 69.11859893798828, 74.09683227539062, 79.0750732421875, 84.05331420898438, 89.03154754638672, 94.00978088378906, 98.98802185058594, 103.96626281738281, 108.94449615478516, 113.9227294921875, 118.90097045898438, 123.87921142578125, 128.85745239257812, 133.83567810058594, 138.8139190673828, 143.7921600341797, 148.7703857421875, 153.74862670898438, 158.72686767578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 4.0, 12.0, 16.0, 27.0, 27.0, 34.0, 65.0, 74.0, 101.0, 114.0, 178.0, 248.0, 347.0, 444.0, 705.0, 1101.0, 1795.0, 3163.0, 5883.0, 12140.0, 30468.0, 109577.0, 3737310.0, 213040.0, 43991.0, 16193.0, 7428.0, 3729.0, 2175.0, 1313.0, 772.0, 504.0, 341.0, 258.0, 185.0, 122.0, 89.0, 71.0, 52.0, 33.0, 37.0, 13.0, 17.0, 8.0, 11.0, 9.0, 6.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0], "bins": [-66.375, -64.3427734375, -62.310546875, -60.2783203125, -58.24609375, -56.2138671875, -54.181640625, -52.1494140625, -50.1171875, -48.0849609375, -46.052734375, -44.0205078125, -41.98828125, -39.9560546875, -37.923828125, -35.8916015625, -33.859375, -31.8271484375, -29.794921875, -27.7626953125, -25.73046875, -23.6982421875, -21.666015625, -19.6337890625, -17.6015625, -15.5693359375, -13.537109375, -11.5048828125, -9.47265625, -7.4404296875, -5.408203125, -3.3759765625, -1.34375, 0.6884765625, 2.720703125, 4.7529296875, 6.78515625, 8.8173828125, 10.849609375, 12.8818359375, 14.9140625, 16.9462890625, 18.978515625, 21.0107421875, 23.04296875, 25.0751953125, 27.107421875, 29.1396484375, 31.171875, 33.2041015625, 35.236328125, 37.2685546875, 39.30078125, 41.3330078125, 43.365234375, 45.3974609375, 47.4296875, 49.4619140625, 51.494140625, 53.5263671875, 55.55859375, 57.5908203125, 59.623046875, 61.6552734375, 63.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 7.0, 5.0, 6.0, 7.0, 8.0, 10.0, 15.0, 8.0, 19.0, 23.0, 14.0, 28.0, 28.0, 32.0, 28.0, 32.0, 38.0, 29.0, 34.0, 39.0, 42.0, 39.0, 41.0, 38.0, 46.0, 39.0, 53.0, 36.0, 32.0, 32.0, 29.0, 23.0, 19.0, 16.0, 19.0, 17.0, 9.0, 15.0, 8.0, 9.0, 10.0, 1.0, 5.0, 8.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.39453125, -7.16351318359375, -6.9324951171875, -6.70147705078125, -6.470458984375, -6.23944091796875, -6.0084228515625, -5.77740478515625, -5.54638671875, -5.31536865234375, -5.0843505859375, -4.85333251953125, -4.622314453125, -4.39129638671875, -4.1602783203125, -3.92926025390625, -3.6982421875, -3.46722412109375, -3.2362060546875, -3.00518798828125, -2.774169921875, -2.54315185546875, -2.3121337890625, -2.08111572265625, -1.85009765625, -1.61907958984375, -1.3880615234375, -1.15704345703125, -0.926025390625, -0.69500732421875, -0.4639892578125, -0.23297119140625, -0.001953125, 0.22906494140625, 0.4600830078125, 0.69110107421875, 0.922119140625, 1.15313720703125, 1.3841552734375, 1.61517333984375, 1.84619140625, 2.07720947265625, 2.3082275390625, 2.53924560546875, 2.770263671875, 3.00128173828125, 3.2322998046875, 3.46331787109375, 3.6943359375, 3.92535400390625, 4.1563720703125, 4.38739013671875, 4.618408203125, 4.84942626953125, 5.0804443359375, 5.31146240234375, 5.54248046875, 5.77349853515625, 6.0045166015625, 6.23553466796875, 6.466552734375, 6.69757080078125, 6.9285888671875, 7.15960693359375, 7.390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 12.0, 11.0, 9.0, 17.0, 22.0, 22.0, 32.0, 52.0, 51.0, 68.0, 76.0, 120.0, 124.0, 186.0, 193.0, 262.0, 342.0, 426.0, 610.0, 895.0, 1483.0, 3126.0, 7892.0, 27869.0, 238192.0, 3801709.0, 82641.0, 16205.0, 5064.0, 2206.0, 1211.0, 705.0, 529.0, 404.0, 281.0, 258.0, 211.0, 172.0, 114.0, 108.0, 82.0, 75.0, 49.0, 38.0, 39.0, 19.0, 24.0, 14.0, 12.0, 10.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-105.0, -101.6455078125, -98.291015625, -94.9365234375, -91.58203125, -88.2275390625, -84.873046875, -81.5185546875, -78.1640625, -74.8095703125, -71.455078125, -68.1005859375, -64.74609375, -61.3916015625, -58.037109375, -54.6826171875, -51.328125, -47.9736328125, -44.619140625, -41.2646484375, -37.91015625, -34.5556640625, -31.201171875, -27.8466796875, -24.4921875, -21.1376953125, -17.783203125, -14.4287109375, -11.07421875, -7.7197265625, -4.365234375, -1.0107421875, 2.34375, 5.6982421875, 9.052734375, 12.4072265625, 15.76171875, 19.1162109375, 22.470703125, 25.8251953125, 29.1796875, 32.5341796875, 35.888671875, 39.2431640625, 42.59765625, 45.9521484375, 49.306640625, 52.6611328125, 56.015625, 59.3701171875, 62.724609375, 66.0791015625, 69.43359375, 72.7880859375, 76.142578125, 79.4970703125, 82.8515625, 86.2060546875, 89.560546875, 92.9150390625, 96.26953125, 99.6240234375, 102.978515625, 106.3330078125, 109.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 9.0, 15.0, 26.0, 49.0, 139.0, 553.0, 2870.0, 263.0, 68.0, 32.0, 18.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.90625, -59.986328125, -58.06640625, -56.146484375, -54.2265625, -52.306640625, -50.38671875, -48.466796875, -46.546875, -44.626953125, -42.70703125, -40.787109375, -38.8671875, -36.947265625, -35.02734375, -33.107421875, -31.1875, -29.267578125, -27.34765625, -25.427734375, -23.5078125, -21.587890625, -19.66796875, -17.748046875, -15.828125, -13.908203125, -11.98828125, -10.068359375, -8.1484375, -6.228515625, -4.30859375, -2.388671875, -0.46875, 1.451171875, 3.37109375, 5.291015625, 7.2109375, 9.130859375, 11.05078125, 12.970703125, 14.890625, 16.810546875, 18.73046875, 20.650390625, 22.5703125, 24.490234375, 26.41015625, 28.330078125, 30.25, 32.169921875, 34.08984375, 36.009765625, 37.9296875, 39.849609375, 41.76953125, 43.689453125, 45.609375, 47.529296875, 49.44921875, 51.369140625, 53.2890625, 55.208984375, 57.12890625, 59.048828125, 60.96875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 6.0, 8.0, 14.0, 14.0, 34.0, 33.0, 53.0, 68.0, 108.0, 120.0, 160.0, 122.0, 75.0, 53.0, 40.0, 22.0, 15.0, 21.0, 6.0, 8.0, 9.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.16546630859375, -134.84486389160156, -128.52427673339844, -122.20367431640625, -115.8830795288086, -109.56248474121094, -103.24188232421875, -96.9212875366211, -90.60069274902344, -84.28009796142578, -77.95950317382812, -71.63890075683594, -65.31830596923828, -58.997711181640625, -52.6771125793457, -46.35651397705078, -40.035919189453125, -33.71532440185547, -27.394725799560547, -21.074129104614258, -14.753532409667969, -8.43293571472168, -2.1123390197753906, 4.208259582519531, 10.528854370117188, 16.849451065063477, 23.170047760009766, 29.490644454956055, 35.811241149902344, 42.1318359375, 48.45243453979492, 54.773033142089844, 61.0936279296875, 67.41422271728516, 73.73481750488281, 80.055419921875, 86.37601470947266, 92.69660949707031, 99.0172119140625, 105.33780670166016, 111.65840148925781, 117.97899627685547, 124.29959106445312, 130.6201934814453, 136.9407958984375, 143.26138305664062, 149.5819854736328, 155.902587890625, 162.22317504882812, 168.5437774658203, 174.86436462402344, 181.18496704101562, 187.50555419921875, 193.82615661621094, 200.14675903320312, 206.46734619140625, 212.78794860839844, 219.10855102539062, 225.42913818359375, 231.74974060058594, 238.07034301757812, 244.39093017578125, 250.71153259277344, 257.0321350097656, 263.35272216796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 5.0, 18.0, 13.0, 13.0, 19.0, 24.0, 19.0, 27.0, 21.0, 36.0, 30.0, 21.0, 37.0, 36.0, 41.0, 37.0, 34.0, 43.0, 49.0, 41.0, 33.0, 44.0, 43.0, 34.0, 35.0, 42.0, 14.0, 20.0, 28.0, 25.0, 22.0, 14.0, 7.0, 9.0, 10.0, 6.0, 7.0, 5.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-112.75352478027344, -109.40979766845703, -106.06607055664062, -102.72233581542969, -99.37860870361328, -96.03488159179688, -92.69115447998047, -89.34742736816406, -86.00369262695312, -82.65996551513672, -79.31623840332031, -75.97250366210938, -72.62877655029297, -69.28504943847656, -65.94132232666016, -62.597591400146484, -59.25386428833008, -55.91013717651367, -52.56640625, -49.222679138183594, -45.87894821166992, -42.535221099853516, -39.191490173339844, -35.84776306152344, -32.50403594970703, -29.160306930541992, -25.816577911376953, -22.472850799560547, -19.129119873046875, -15.785392761230469, -12.44166374206543, -9.09793472290039, -5.754203796386719, -2.410475015640259, 0.9332537651062012, 4.276982307434082, 7.620711326599121, 10.964439392089844, 14.308168411254883, 17.651897430419922, 20.99562644958496, 24.33935546875, 27.68308448791504, 31.026813507080078, 34.370540618896484, 37.714271545410156, 41.05799865722656, 44.40172576904297, 47.74545669555664, 51.08918380737305, 54.43291473388672, 57.776641845703125, 61.1203727722168, 64.46409606933594, 67.80783081054688, 71.15155792236328, 74.49528503417969, 77.8390121459961, 81.1827392578125, 84.52647399902344, 87.87020111083984, 91.21392822265625, 94.55765533447266, 97.90138244628906, 101.2451171875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 21.0, 26.0, 33.0, 42.0, 53.0, 68.0, 125.0, 172.0, 234.0, 355.0, 505.0, 739.0, 1173.0, 1824.0, 3011.0, 5414.0, 10012.0, 20681.0, 47120.0, 127742.0, 426942.0, 256452.0, 79960.0, 32147.0, 15191.0, 7546.0, 4119.0, 2426.0, 1442.0, 937.0, 609.0, 428.0, 262.0, 192.0, 134.0, 104.0, 80.0, 63.0, 35.0, 26.0, 14.0, 18.0, 9.0, 11.0, 9.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-44.8125, -43.40234375, -41.9921875, -40.58203125, -39.171875, -37.76171875, -36.3515625, -34.94140625, -33.53125, -32.12109375, -30.7109375, -29.30078125, -27.890625, -26.48046875, -25.0703125, -23.66015625, -22.25, -20.83984375, -19.4296875, -18.01953125, -16.609375, -15.19921875, -13.7890625, -12.37890625, -10.96875, -9.55859375, -8.1484375, -6.73828125, -5.328125, -3.91796875, -2.5078125, -1.09765625, 0.3125, 1.72265625, 3.1328125, 4.54296875, 5.953125, 7.36328125, 8.7734375, 10.18359375, 11.59375, 13.00390625, 14.4140625, 15.82421875, 17.234375, 18.64453125, 20.0546875, 21.46484375, 22.875, 24.28515625, 25.6953125, 27.10546875, 28.515625, 29.92578125, 31.3359375, 32.74609375, 34.15625, 35.56640625, 36.9765625, 38.38671875, 39.796875, 41.20703125, 42.6171875, 44.02734375, 45.4375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 8.0, 6.0, 13.0, 17.0, 15.0, 18.0, 25.0, 31.0, 23.0, 29.0, 29.0, 43.0, 35.0, 44.0, 43.0, 46.0, 44.0, 49.0, 48.0, 41.0, 51.0, 35.0, 28.0, 33.0, 39.0, 26.0, 29.0, 19.0, 16.0, 24.0, 13.0, 12.0, 12.0, 9.0, 6.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-11.2734375, -10.94287109375, -10.6123046875, -10.28173828125, -9.951171875, -9.62060546875, -9.2900390625, -8.95947265625, -8.62890625, -8.29833984375, -7.9677734375, -7.63720703125, -7.306640625, -6.97607421875, -6.6455078125, -6.31494140625, -5.984375, -5.65380859375, -5.3232421875, -4.99267578125, -4.662109375, -4.33154296875, -4.0009765625, -3.67041015625, -3.33984375, -3.00927734375, -2.6787109375, -2.34814453125, -2.017578125, -1.68701171875, -1.3564453125, -1.02587890625, -0.6953125, -0.36474609375, -0.0341796875, 0.29638671875, 0.626953125, 0.95751953125, 1.2880859375, 1.61865234375, 1.94921875, 2.27978515625, 2.6103515625, 2.94091796875, 3.271484375, 3.60205078125, 3.9326171875, 4.26318359375, 4.59375, 4.92431640625, 5.2548828125, 5.58544921875, 5.916015625, 6.24658203125, 6.5771484375, 6.90771484375, 7.23828125, 7.56884765625, 7.8994140625, 8.22998046875, 8.560546875, 8.89111328125, 9.2216796875, 9.55224609375, 9.8828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 15.0, 21.0, 28.0, 47.0, 79.0, 131.0, 243.0, 387.0, 662.0, 1286.0, 2535.0, 5259.0, 13111.0, 42051.0, 224656.0, 618690.0, 98678.0, 24367.0, 8476.0, 3707.0, 1805.0, 987.0, 531.0, 293.0, 170.0, 121.0, 76.0, 49.0, 22.0, 17.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5, -64.56005859375, -62.6201171875, -60.68017578125, -58.740234375, -56.80029296875, -54.8603515625, -52.92041015625, -50.98046875, -49.04052734375, -47.1005859375, -45.16064453125, -43.220703125, -41.28076171875, -39.3408203125, -37.40087890625, -35.4609375, -33.52099609375, -31.5810546875, -29.64111328125, -27.701171875, -25.76123046875, -23.8212890625, -21.88134765625, -19.94140625, -18.00146484375, -16.0615234375, -14.12158203125, -12.181640625, -10.24169921875, -8.3017578125, -6.36181640625, -4.421875, -2.48193359375, -0.5419921875, 1.39794921875, 3.337890625, 5.27783203125, 7.2177734375, 9.15771484375, 11.09765625, 13.03759765625, 14.9775390625, 16.91748046875, 18.857421875, 20.79736328125, 22.7373046875, 24.67724609375, 26.6171875, 28.55712890625, 30.4970703125, 32.43701171875, 34.376953125, 36.31689453125, 38.2568359375, 40.19677734375, 42.13671875, 44.07666015625, 46.0166015625, 47.95654296875, 49.896484375, 51.83642578125, 53.7763671875, 55.71630859375, 57.65625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 10.0, 6.0, 11.0, 12.0, 9.0, 19.0, 19.0, 21.0, 27.0, 30.0, 32.0, 42.0, 42.0, 56.0, 53.0, 45.0, 68.0, 59.0, 42.0, 46.0, 47.0, 44.0, 39.0, 39.0, 27.0, 24.0, 24.0, 20.0, 18.0, 13.0, 13.0, 7.0, 7.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.09375, -50.39453125, -48.6953125, -46.99609375, -45.296875, -43.59765625, -41.8984375, -40.19921875, -38.5, -36.80078125, -35.1015625, -33.40234375, -31.703125, -30.00390625, -28.3046875, -26.60546875, -24.90625, -23.20703125, -21.5078125, -19.80859375, -18.109375, -16.41015625, -14.7109375, -13.01171875, -11.3125, -9.61328125, -7.9140625, -6.21484375, -4.515625, -2.81640625, -1.1171875, 0.58203125, 2.28125, 3.98046875, 5.6796875, 7.37890625, 9.078125, 10.77734375, 12.4765625, 14.17578125, 15.875, 17.57421875, 19.2734375, 20.97265625, 22.671875, 24.37109375, 26.0703125, 27.76953125, 29.46875, 31.16796875, 32.8671875, 34.56640625, 36.265625, 37.96484375, 39.6640625, 41.36328125, 43.0625, 44.76171875, 46.4609375, 48.16015625, 49.859375, 51.55859375, 53.2578125, 54.95703125, 56.65625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 7.0, 9.0, 22.0, 23.0, 38.0, 37.0, 85.0, 135.0, 221.0, 368.0, 607.0, 1275.0, 2579.0, 5967.0, 16613.0, 65817.0, 520756.0, 360916.0, 49515.0, 13646.0, 5040.0, 2290.0, 1118.0, 594.0, 346.0, 203.0, 101.0, 71.0, 49.0, 37.0, 26.0, 10.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.53125, -24.7783203125, -24.025390625, -23.2724609375, -22.51953125, -21.7666015625, -21.013671875, -20.2607421875, -19.5078125, -18.7548828125, -18.001953125, -17.2490234375, -16.49609375, -15.7431640625, -14.990234375, -14.2373046875, -13.484375, -12.7314453125, -11.978515625, -11.2255859375, -10.47265625, -9.7197265625, -8.966796875, -8.2138671875, -7.4609375, -6.7080078125, -5.955078125, -5.2021484375, -4.44921875, -3.6962890625, -2.943359375, -2.1904296875, -1.4375, -0.6845703125, 0.068359375, 0.8212890625, 1.57421875, 2.3271484375, 3.080078125, 3.8330078125, 4.5859375, 5.3388671875, 6.091796875, 6.8447265625, 7.59765625, 8.3505859375, 9.103515625, 9.8564453125, 10.609375, 11.3623046875, 12.115234375, 12.8681640625, 13.62109375, 14.3740234375, 15.126953125, 15.8798828125, 16.6328125, 17.3857421875, 18.138671875, 18.8916015625, 19.64453125, 20.3974609375, 21.150390625, 21.9033203125, 22.65625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 3.0, 18.0, 19.0, 40.0, 91.0, 280.0, 274.0, 121.0, 57.0, 33.0, 16.0, 16.0, 4.0, 5.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00972747802734375, -0.009354829788208008, -0.008982181549072266, -0.008609533309936523, -0.008236885070800781, -0.007864236831665039, -0.007491588592529297, -0.007118940353393555, -0.0067462921142578125, -0.00637364387512207, -0.006000995635986328, -0.005628347396850586, -0.005255699157714844, -0.0048830509185791016, -0.004510402679443359, -0.004137754440307617, -0.003765106201171875, -0.003392457962036133, -0.0030198097229003906, -0.0026471614837646484, -0.0022745132446289062, -0.001901865005493164, -0.0015292167663574219, -0.0011565685272216797, -0.0007839202880859375, -0.0004112720489501953, -3.8623809814453125e-05, 0.00033402442932128906, 0.0007066726684570312, 0.0010793209075927734, 0.0014519691467285156, 0.0018246173858642578, 0.002197265625, 0.002569913864135742, 0.0029425621032714844, 0.0033152103424072266, 0.0036878585815429688, 0.004060506820678711, 0.004433155059814453, 0.004805803298950195, 0.0051784515380859375, 0.00555109977722168, 0.005923748016357422, 0.006296396255493164, 0.006669044494628906, 0.0070416927337646484, 0.007414340972900391, 0.007786989212036133, 0.008159637451171875, 0.008532285690307617, 0.00890493392944336, 0.009277582168579102, 0.009650230407714844, 0.010022878646850586, 0.010395526885986328, 0.01076817512512207, 0.011140823364257812, 0.011513471603393555, 0.011886119842529297, 0.012258768081665039, 0.012631416320800781, 0.013004064559936523, 0.013376712799072266, 0.013749361038208008, 0.01412200927734375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 6.0, 7.0, 11.0, 14.0, 28.0, 34.0, 52.0, 82.0, 136.0, 173.0, 303.0, 423.0, 689.0, 1074.0, 2022.0, 3475.0, 6974.0, 16102.0, 47111.0, 206575.0, 550518.0, 148252.0, 37211.0, 13483.0, 6035.0, 3118.0, 1740.0, 1033.0, 654.0, 397.0, 241.0, 165.0, 127.0, 89.0, 49.0, 37.0, 31.0, 14.0, 13.0, 8.0, 6.0, 8.0, 4.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.9375, -18.35302734375, -17.7685546875, -17.18408203125, -16.599609375, -16.01513671875, -15.4306640625, -14.84619140625, -14.26171875, -13.67724609375, -13.0927734375, -12.50830078125, -11.923828125, -11.33935546875, -10.7548828125, -10.17041015625, -9.5859375, -9.00146484375, -8.4169921875, -7.83251953125, -7.248046875, -6.66357421875, -6.0791015625, -5.49462890625, -4.91015625, -4.32568359375, -3.7412109375, -3.15673828125, -2.572265625, -1.98779296875, -1.4033203125, -0.81884765625, -0.234375, 0.35009765625, 0.9345703125, 1.51904296875, 2.103515625, 2.68798828125, 3.2724609375, 3.85693359375, 4.44140625, 5.02587890625, 5.6103515625, 6.19482421875, 6.779296875, 7.36376953125, 7.9482421875, 8.53271484375, 9.1171875, 9.70166015625, 10.2861328125, 10.87060546875, 11.455078125, 12.03955078125, 12.6240234375, 13.20849609375, 13.79296875, 14.37744140625, 14.9619140625, 15.54638671875, 16.130859375, 16.71533203125, 17.2998046875, 17.88427734375, 18.46875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 5.0, 10.0, 7.0, 11.0, 17.0, 12.0, 24.0, 28.0, 32.0, 41.0, 75.0, 60.0, 83.0, 110.0, 92.0, 91.0, 66.0, 55.0, 33.0, 27.0, 21.0, 16.0, 13.0, 15.0, 10.0, 4.0, 3.0, 6.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.890625, -16.352783203125, -15.81494140625, -15.277099609375, -14.7392578125, -14.201416015625, -13.66357421875, -13.125732421875, -12.587890625, -12.050048828125, -11.51220703125, -10.974365234375, -10.4365234375, -9.898681640625, -9.36083984375, -8.822998046875, -8.28515625, -7.747314453125, -7.20947265625, -6.671630859375, -6.1337890625, -5.595947265625, -5.05810546875, -4.520263671875, -3.982421875, -3.444580078125, -2.90673828125, -2.368896484375, -1.8310546875, -1.293212890625, -0.75537109375, -0.217529296875, 0.3203125, 0.858154296875, 1.39599609375, 1.933837890625, 2.4716796875, 3.009521484375, 3.54736328125, 4.085205078125, 4.623046875, 5.160888671875, 5.69873046875, 6.236572265625, 6.7744140625, 7.312255859375, 7.85009765625, 8.387939453125, 8.92578125, 9.463623046875, 10.00146484375, 10.539306640625, 11.0771484375, 11.614990234375, 12.15283203125, 12.690673828125, 13.228515625, 13.766357421875, 14.30419921875, 14.842041015625, 15.3798828125, 15.917724609375, 16.45556640625, 16.993408203125, 17.53125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 19.0, 18.0, 32.0, 62.0, 82.0, 160.0, 174.0, 143.0, 119.0, 72.0, 47.0, 33.0, 22.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-593.1904907226562, -577.7869262695312, -562.38330078125, -546.979736328125, -531.5761108398438, -516.1725463867188, -500.7689514160156, -485.3653564453125, -469.9617614746094, -454.55816650390625, -439.1545715332031, -423.7509765625, -408.347412109375, -392.9438171386719, -377.54022216796875, -362.1366271972656, -346.7330322265625, -331.3294372558594, -315.92584228515625, -300.52227783203125, -285.1186828613281, -269.715087890625, -254.31149291992188, -238.90789794921875, -223.50433349609375, -208.10073852539062, -192.69715881347656, -177.29356384277344, -161.8899688720703, -146.48638916015625, -131.08279418945312, -115.67919921875, -100.27560424804688, -84.87201690673828, -69.46842193603516, -54.06483459472656, -38.6612434387207, -23.257652282714844, -7.85406494140625, 7.549530029296875, 22.95311737060547, 38.35670852661133, 53.76029968261719, 69.16388702392578, 84.56747436523438, 99.9710693359375, 115.3746566772461, 130.77825927734375, 146.1818389892578, 161.58543395996094, 176.989013671875, 192.39260864257812, 207.79620361328125, 223.19979858398438, 238.60337829589844, 254.00697326660156, 269.4105529785156, 284.81414794921875, 300.2177429199219, 315.621337890625, 331.02490234375, 346.4284973144531, 361.83209228515625, 377.2356872558594, 392.6392822265625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 4.0, 9.0, 8.0, 11.0, 17.0, 17.0, 19.0, 17.0, 38.0, 20.0, 20.0, 27.0, 35.0, 43.0, 48.0, 51.0, 44.0, 38.0, 42.0, 41.0, 51.0, 48.0, 47.0, 44.0, 33.0, 43.0, 28.0, 20.0, 19.0, 21.0, 10.0, 19.0, 9.0, 12.0, 14.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-284.66607666015625, -276.7821350097656, -268.898193359375, -261.0142517089844, -253.1302947998047, -245.24635314941406, -237.36241149902344, -229.4784698486328, -221.59451293945312, -213.7105712890625, -205.82662963867188, -197.94268798828125, -190.05873107910156, -182.17478942871094, -174.2908477783203, -166.4069061279297, -158.52296447753906, -150.63902282714844, -142.7550811767578, -134.87112426757812, -126.9871826171875, -119.10324096679688, -111.21929931640625, -103.33535766601562, -95.45140838623047, -87.56746673583984, -79.68351745605469, -71.79957580566406, -63.91563034057617, -56.03168487548828, -48.147743225097656, -40.263797760009766, -32.379852294921875, -24.495906829833984, -16.611963272094727, -8.728019714355469, -0.8440742492675781, 7.0398712158203125, 14.923812866210938, 22.807758331298828, 30.69170379638672, 38.57564926147461, 46.4595947265625, 54.343536376953125, 62.227481842041016, 70.1114273071289, 77.99536895751953, 85.87931823730469, 93.76325988769531, 101.64720153808594, 109.5311508178711, 117.41509246826172, 125.29904174804688, 133.1829833984375, 141.06692504882812, 148.95086669921875, 156.83480834960938, 164.71875, 172.60269165039062, 180.48663330078125, 188.37059020996094, 196.25453186035156, 204.1384735107422, 212.0224151611328, 219.9063720703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 9.0, 6.0, 7.0, 6.0, 7.0, 9.0, 8.0, 15.0, 23.0, 22.0, 35.0, 45.0, 52.0, 85.0, 110.0, 134.0, 202.0, 229.0, 343.0, 510.0, 735.0, 1082.0, 1665.0, 2543.0, 4464.0, 8500.0, 18487.0, 48152.0, 238041.0, 3690454.0, 115384.0, 33001.0, 13288.0, 6541.0, 3623.0, 2087.0, 1295.0, 946.0, 593.0, 393.0, 315.0, 226.0, 171.0, 101.0, 80.0, 69.0, 47.0, 46.0, 29.0, 19.0, 19.0, 13.0, 6.0, 6.0, 3.0, 7.0, 2.0, 1.0, 5.0, 2.0, 1.0], "bins": [-66.375, -64.3212890625, -62.267578125, -60.2138671875, -58.16015625, -56.1064453125, -54.052734375, -51.9990234375, -49.9453125, -47.8916015625, -45.837890625, -43.7841796875, -41.73046875, -39.6767578125, -37.623046875, -35.5693359375, -33.515625, -31.4619140625, -29.408203125, -27.3544921875, -25.30078125, -23.2470703125, -21.193359375, -19.1396484375, -17.0859375, -15.0322265625, -12.978515625, -10.9248046875, -8.87109375, -6.8173828125, -4.763671875, -2.7099609375, -0.65625, 1.3974609375, 3.451171875, 5.5048828125, 7.55859375, 9.6123046875, 11.666015625, 13.7197265625, 15.7734375, 17.8271484375, 19.880859375, 21.9345703125, 23.98828125, 26.0419921875, 28.095703125, 30.1494140625, 32.203125, 34.2568359375, 36.310546875, 38.3642578125, 40.41796875, 42.4716796875, 44.525390625, 46.5791015625, 48.6328125, 50.6865234375, 52.740234375, 54.7939453125, 56.84765625, 58.9013671875, 60.955078125, 63.0087890625, 65.0625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 3.0, 8.0, 10.0, 14.0, 16.0, 15.0, 17.0, 23.0, 34.0, 40.0, 28.0, 27.0, 38.0, 44.0, 40.0, 50.0, 40.0, 48.0, 42.0, 49.0, 44.0, 41.0, 36.0, 40.0, 32.0, 25.0, 32.0, 26.0, 15.0, 25.0, 20.0, 14.0, 10.0, 8.0, 8.0, 13.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.5899658203125, -9.258056640625, -8.9261474609375, -8.59423828125, -8.2623291015625, -7.930419921875, -7.5985107421875, -7.2666015625, -6.9346923828125, -6.602783203125, -6.2708740234375, -5.93896484375, -5.6070556640625, -5.275146484375, -4.9432373046875, -4.611328125, -4.2794189453125, -3.947509765625, -3.6156005859375, -3.28369140625, -2.9517822265625, -2.619873046875, -2.2879638671875, -1.9560546875, -1.6241455078125, -1.292236328125, -0.9603271484375, -0.62841796875, -0.2965087890625, 0.035400390625, 0.3673095703125, 0.69921875, 1.0311279296875, 1.363037109375, 1.6949462890625, 2.02685546875, 2.3587646484375, 2.690673828125, 3.0225830078125, 3.3544921875, 3.6864013671875, 4.018310546875, 4.3502197265625, 4.68212890625, 5.0140380859375, 5.345947265625, 5.6778564453125, 6.009765625, 6.3416748046875, 6.673583984375, 7.0054931640625, 7.33740234375, 7.6693115234375, 8.001220703125, 8.3331298828125, 8.6650390625, 8.9969482421875, 9.328857421875, 9.6607666015625, 9.99267578125, 10.3245849609375, 10.656494140625, 10.9884033203125, 11.3203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 2.0, 9.0, 8.0, 15.0, 14.0, 25.0, 21.0, 27.0, 34.0, 36.0, 59.0, 70.0, 99.0, 127.0, 214.0, 348.0, 589.0, 1016.0, 2219.0, 6018.0, 26854.0, 1659761.0, 2458543.0, 27167.0, 6051.0, 2233.0, 1064.0, 569.0, 329.0, 180.0, 142.0, 105.0, 77.0, 59.0, 41.0, 34.0, 26.0, 20.0, 21.0, 11.0, 7.0, 9.0, 6.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0], "bins": [-200.375, -194.650390625, -188.92578125, -183.201171875, -177.4765625, -171.751953125, -166.02734375, -160.302734375, -154.578125, -148.853515625, -143.12890625, -137.404296875, -131.6796875, -125.955078125, -120.23046875, -114.505859375, -108.78125, -103.056640625, -97.33203125, -91.607421875, -85.8828125, -80.158203125, -74.43359375, -68.708984375, -62.984375, -57.259765625, -51.53515625, -45.810546875, -40.0859375, -34.361328125, -28.63671875, -22.912109375, -17.1875, -11.462890625, -5.73828125, -0.013671875, 5.7109375, 11.435546875, 17.16015625, 22.884765625, 28.609375, 34.333984375, 40.05859375, 45.783203125, 51.5078125, 57.232421875, 62.95703125, 68.681640625, 74.40625, 80.130859375, 85.85546875, 91.580078125, 97.3046875, 103.029296875, 108.75390625, 114.478515625, 120.203125, 125.927734375, 131.65234375, 137.376953125, 143.1015625, 148.826171875, 154.55078125, 160.275390625, 166.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 16.0, 36.0, 108.0, 500.0, 3073.0, 213.0, 65.0, 22.0, 11.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.375, -126.8740234375, -123.373046875, -119.8720703125, -116.37109375, -112.8701171875, -109.369140625, -105.8681640625, -102.3671875, -98.8662109375, -95.365234375, -91.8642578125, -88.36328125, -84.8623046875, -81.361328125, -77.8603515625, -74.359375, -70.8583984375, -67.357421875, -63.8564453125, -60.35546875, -56.8544921875, -53.353515625, -49.8525390625, -46.3515625, -42.8505859375, -39.349609375, -35.8486328125, -32.34765625, -28.8466796875, -25.345703125, -21.8447265625, -18.34375, -14.8427734375, -11.341796875, -7.8408203125, -4.33984375, -0.8388671875, 2.662109375, 6.1630859375, 9.6640625, 13.1650390625, 16.666015625, 20.1669921875, 23.66796875, 27.1689453125, 30.669921875, 34.1708984375, 37.671875, 41.1728515625, 44.673828125, 48.1748046875, 51.67578125, 55.1767578125, 58.677734375, 62.1787109375, 65.6796875, 69.1806640625, 72.681640625, 76.1826171875, 79.68359375, 83.1845703125, 86.685546875, 90.1865234375, 93.6875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 4.0, 5.0, 10.0, 8.0, 17.0, 29.0, 55.0, 49.0, 116.0, 150.0, 180.0, 135.0, 83.0, 64.0, 28.0, 27.0, 18.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0], "bins": [-574.7474365234375, -563.2962646484375, -551.8450927734375, -540.3939819335938, -528.9428100585938, -517.4916381835938, -506.04046630859375, -494.58929443359375, -483.1381530761719, -471.6869812011719, -460.23583984375, -448.78466796875, -437.33349609375, -425.8823547363281, -414.4311828613281, -402.98004150390625, -391.52886962890625, -380.07769775390625, -368.6265563964844, -357.1753845214844, -345.7242431640625, -334.2730712890625, -322.8218994140625, -311.3707275390625, -299.9195861816406, -288.4684143066406, -277.01727294921875, -265.56610107421875, -254.1149444580078, -242.66378784179688, -231.21261596679688, -219.76145935058594, -208.310302734375, -196.85914611816406, -185.40798950195312, -173.95681762695312, -162.5056610107422, -151.05450439453125, -139.60333251953125, -128.1521759033203, -116.70101928710938, -105.24986267089844, -93.79869842529297, -82.3475341796875, -70.89637756347656, -59.44521713256836, -47.994056701660156, -36.54289245605469, -25.09173583984375, -13.640575408935547, -2.1894149780273438, 9.26174545288086, 20.712905883789062, 32.164066314697266, 43.61522674560547, 55.06639099121094, 66.51754760742188, 77.96870422363281, 89.41986846923828, 100.87103271484375, 112.32218933105469, 123.77334594726562, 135.22451782226562, 146.67567443847656, 158.1268310546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 0.0, 3.0, 7.0, 10.0, 5.0, 7.0, 10.0, 10.0, 16.0, 10.0, 16.0, 17.0, 22.0, 26.0, 25.0, 25.0, 31.0, 38.0, 27.0, 30.0, 43.0, 52.0, 34.0, 41.0, 40.0, 52.0, 39.0, 37.0, 43.0, 53.0, 24.0, 24.0, 33.0, 28.0, 15.0, 18.0, 17.0, 13.0, 9.0, 13.0, 5.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-137.32858276367188, -132.5045166015625, -127.68045806884766, -122.85639190673828, -118.03233337402344, -113.20826721191406, -108.38420104980469, -103.56013488769531, -98.73607635498047, -93.9120101928711, -89.08795166015625, -84.26388549804688, -79.4398193359375, -74.61576080322266, -69.79169464111328, -64.96763610839844, -60.14356994628906, -55.31950759887695, -50.495445251464844, -45.67137908935547, -40.84731674194336, -36.02325439453125, -31.199190139770508, -26.375125885009766, -21.551063537597656, -16.727001190185547, -11.902936935424805, -7.078873634338379, -2.254810333251953, 2.5692520141601562, 7.393316268920898, 12.21738052368164, 17.04144287109375, 21.86550521850586, 26.6895694732666, 31.513633728027344, 36.33769607543945, 41.16175842285156, 45.98582458496094, 50.80988693237305, 55.633949279785156, 60.458011627197266, 65.28207397460938, 70.10614013671875, 74.93020629882812, 79.75426483154297, 84.57833099365234, 89.40238952636719, 94.22645568847656, 99.05052185058594, 103.87458038330078, 108.69864654541016, 113.522705078125, 118.34677124023438, 123.17083740234375, 127.99490356445312, 132.8189697265625, 137.64303588867188, 142.46710205078125, 147.29115295410156, 152.11521911621094, 156.9392852783203, 161.7633514404297, 166.58741760253906, 171.41146850585938]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 15.0, 13.0, 20.0, 20.0, 30.0, 47.0, 57.0, 77.0, 109.0, 143.0, 200.0, 260.0, 384.0, 548.0, 902.0, 1465.0, 2783.0, 5954.0, 14397.0, 44557.0, 181452.0, 533318.0, 187892.0, 45758.0, 14840.0, 6142.0, 2835.0, 1556.0, 848.0, 526.0, 372.0, 281.0, 185.0, 135.0, 93.0, 79.0, 63.0, 43.0, 27.0, 27.0, 18.0, 13.0, 14.0, 9.0, 12.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -62.5673828125, -60.447265625, -58.3271484375, -56.20703125, -54.0869140625, -51.966796875, -49.8466796875, -47.7265625, -45.6064453125, -43.486328125, -41.3662109375, -39.24609375, -37.1259765625, -35.005859375, -32.8857421875, -30.765625, -28.6455078125, -26.525390625, -24.4052734375, -22.28515625, -20.1650390625, -18.044921875, -15.9248046875, -13.8046875, -11.6845703125, -9.564453125, -7.4443359375, -5.32421875, -3.2041015625, -1.083984375, 1.0361328125, 3.15625, 5.2763671875, 7.396484375, 9.5166015625, 11.63671875, 13.7568359375, 15.876953125, 17.9970703125, 20.1171875, 22.2373046875, 24.357421875, 26.4775390625, 28.59765625, 30.7177734375, 32.837890625, 34.9580078125, 37.078125, 39.1982421875, 41.318359375, 43.4384765625, 45.55859375, 47.6787109375, 49.798828125, 51.9189453125, 54.0390625, 56.1591796875, 58.279296875, 60.3994140625, 62.51953125, 64.6396484375, 66.759765625, 68.8798828125, 71.0]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 9.0, 9.0, 11.0, 11.0, 18.0, 18.0, 25.0, 26.0, 25.0, 31.0, 37.0, 33.0, 36.0, 49.0, 46.0, 43.0, 59.0, 46.0, 40.0, 48.0, 46.0, 41.0, 29.0, 28.0, 36.0, 19.0, 27.0, 24.0, 19.0, 26.0, 10.0, 14.0, 7.0, 8.0, 11.0, 4.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.734375, -13.307373046875, -12.88037109375, -12.453369140625, -12.0263671875, -11.599365234375, -11.17236328125, -10.745361328125, -10.318359375, -9.891357421875, -9.46435546875, -9.037353515625, -8.6103515625, -8.183349609375, -7.75634765625, -7.329345703125, -6.90234375, -6.475341796875, -6.04833984375, -5.621337890625, -5.1943359375, -4.767333984375, -4.34033203125, -3.913330078125, -3.486328125, -3.059326171875, -2.63232421875, -2.205322265625, -1.7783203125, -1.351318359375, -0.92431640625, -0.497314453125, -0.0703125, 0.356689453125, 0.78369140625, 1.210693359375, 1.6376953125, 2.064697265625, 2.49169921875, 2.918701171875, 3.345703125, 3.772705078125, 4.19970703125, 4.626708984375, 5.0537109375, 5.480712890625, 5.90771484375, 6.334716796875, 6.76171875, 7.188720703125, 7.61572265625, 8.042724609375, 8.4697265625, 8.896728515625, 9.32373046875, 9.750732421875, 10.177734375, 10.604736328125, 11.03173828125, 11.458740234375, 11.8857421875, 12.312744140625, 12.73974609375, 13.166748046875, 13.59375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 12.0, 8.0, 15.0, 13.0, 28.0, 30.0, 30.0, 52.0, 74.0, 82.0, 120.0, 188.0, 248.0, 320.0, 471.0, 752.0, 1245.0, 2312.0, 4969.0, 17254.0, 133697.0, 756982.0, 104769.0, 14629.0, 4547.0, 2116.0, 1174.0, 732.0, 487.0, 333.0, 229.0, 148.0, 109.0, 101.0, 71.0, 53.0, 42.0, 22.0, 22.0, 12.0, 16.0, 10.0, 9.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-117.75, -114.33203125, -110.9140625, -107.49609375, -104.078125, -100.66015625, -97.2421875, -93.82421875, -90.40625, -86.98828125, -83.5703125, -80.15234375, -76.734375, -73.31640625, -69.8984375, -66.48046875, -63.0625, -59.64453125, -56.2265625, -52.80859375, -49.390625, -45.97265625, -42.5546875, -39.13671875, -35.71875, -32.30078125, -28.8828125, -25.46484375, -22.046875, -18.62890625, -15.2109375, -11.79296875, -8.375, -4.95703125, -1.5390625, 1.87890625, 5.296875, 8.71484375, 12.1328125, 15.55078125, 18.96875, 22.38671875, 25.8046875, 29.22265625, 32.640625, 36.05859375, 39.4765625, 42.89453125, 46.3125, 49.73046875, 53.1484375, 56.56640625, 59.984375, 63.40234375, 66.8203125, 70.23828125, 73.65625, 77.07421875, 80.4921875, 83.91015625, 87.328125, 90.74609375, 94.1640625, 97.58203125, 101.0]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 11.0, 7.0, 11.0, 18.0, 20.0, 32.0, 51.0, 61.0, 52.0, 79.0, 83.0, 89.0, 87.0, 80.0, 54.0, 62.0, 56.0, 39.0, 30.0, 27.0, 21.0, 7.0, 9.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.1875, -105.3994140625, -101.611328125, -97.8232421875, -94.03515625, -90.2470703125, -86.458984375, -82.6708984375, -78.8828125, -75.0947265625, -71.306640625, -67.5185546875, -63.73046875, -59.9423828125, -56.154296875, -52.3662109375, -48.578125, -44.7900390625, -41.001953125, -37.2138671875, -33.42578125, -29.6376953125, -25.849609375, -22.0615234375, -18.2734375, -14.4853515625, -10.697265625, -6.9091796875, -3.12109375, 0.6669921875, 4.455078125, 8.2431640625, 12.03125, 15.8193359375, 19.607421875, 23.3955078125, 27.18359375, 30.9716796875, 34.759765625, 38.5478515625, 42.3359375, 46.1240234375, 49.912109375, 53.7001953125, 57.48828125, 61.2763671875, 65.064453125, 68.8525390625, 72.640625, 76.4287109375, 80.216796875, 84.0048828125, 87.79296875, 91.5810546875, 95.369140625, 99.1572265625, 102.9453125, 106.7333984375, 110.521484375, 114.3095703125, 118.09765625, 121.8857421875, 125.673828125, 129.4619140625, 133.25]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 2.0, 6.0, 18.0, 20.0, 28.0, 50.0, 64.0, 98.0, 111.0, 168.0, 224.0, 300.0, 457.0, 697.0, 1009.0, 1563.0, 2407.0, 4398.0, 13033.0, 260732.0, 729620.0, 20205.0, 5289.0, 2718.0, 1759.0, 1078.0, 746.0, 512.0, 365.0, 266.0, 170.0, 119.0, 82.0, 55.0, 49.0, 30.0, 29.0, 18.0, 18.0, 9.0, 10.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.75, -81.05859375, -78.3671875, -75.67578125, -72.984375, -70.29296875, -67.6015625, -64.91015625, -62.21875, -59.52734375, -56.8359375, -54.14453125, -51.453125, -48.76171875, -46.0703125, -43.37890625, -40.6875, -37.99609375, -35.3046875, -32.61328125, -29.921875, -27.23046875, -24.5390625, -21.84765625, -19.15625, -16.46484375, -13.7734375, -11.08203125, -8.390625, -5.69921875, -3.0078125, -0.31640625, 2.375, 5.06640625, 7.7578125, 10.44921875, 13.140625, 15.83203125, 18.5234375, 21.21484375, 23.90625, 26.59765625, 29.2890625, 31.98046875, 34.671875, 37.36328125, 40.0546875, 42.74609375, 45.4375, 48.12890625, 50.8203125, 53.51171875, 56.203125, 58.89453125, 61.5859375, 64.27734375, 66.96875, 69.66015625, 72.3515625, 75.04296875, 77.734375, 80.42578125, 83.1171875, 85.80859375, 88.5]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 17.0, 76.0, 309.0, 448.0, 100.0, 21.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0355224609375, -0.03444957733154297, -0.03337669372558594, -0.032303810119628906, -0.031230926513671875, -0.030158042907714844, -0.029085159301757812, -0.02801227569580078, -0.02693939208984375, -0.02586650848388672, -0.024793624877929688, -0.023720741271972656, -0.022647857666015625, -0.021574974060058594, -0.020502090454101562, -0.01942920684814453, -0.0183563232421875, -0.01728343963623047, -0.016210556030273438, -0.015137672424316406, -0.014064788818359375, -0.012991905212402344, -0.011919021606445312, -0.010846138000488281, -0.00977325439453125, -0.008700370788574219, -0.0076274871826171875, -0.006554603576660156, -0.005481719970703125, -0.004408836364746094, -0.0033359527587890625, -0.0022630691528320312, -0.001190185546875, -0.00011730194091796875, 0.0009555816650390625, 0.0020284652709960938, 0.003101348876953125, 0.004174232482910156, 0.0052471160888671875, 0.006319999694824219, 0.00739288330078125, 0.008465766906738281, 0.009538650512695312, 0.010611534118652344, 0.011684417724609375, 0.012757301330566406, 0.013830184936523438, 0.014903068542480469, 0.0159759521484375, 0.01704883575439453, 0.018121719360351562, 0.019194602966308594, 0.020267486572265625, 0.021340370178222656, 0.022413253784179688, 0.02348613739013672, 0.02455902099609375, 0.02563190460205078, 0.026704788208007812, 0.027777671813964844, 0.028850555419921875, 0.029923439025878906, 0.030996322631835938, 0.03206920623779297, 0.03314208984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 23.0, 18.0, 23.0, 32.0, 63.0, 79.0, 137.0, 261.0, 443.0, 792.0, 1540.0, 2902.0, 6596.0, 39430.0, 929007.0, 53086.0, 7391.0, 3085.0, 1625.0, 861.0, 419.0, 283.0, 165.0, 88.0, 55.0, 45.0, 19.0, 14.0, 16.0, 7.0, 12.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-99.1875, -95.9404296875, -92.693359375, -89.4462890625, -86.19921875, -82.9521484375, -79.705078125, -76.4580078125, -73.2109375, -69.9638671875, -66.716796875, -63.4697265625, -60.22265625, -56.9755859375, -53.728515625, -50.4814453125, -47.234375, -43.9873046875, -40.740234375, -37.4931640625, -34.24609375, -30.9990234375, -27.751953125, -24.5048828125, -21.2578125, -18.0107421875, -14.763671875, -11.5166015625, -8.26953125, -5.0224609375, -1.775390625, 1.4716796875, 4.71875, 7.9658203125, 11.212890625, 14.4599609375, 17.70703125, 20.9541015625, 24.201171875, 27.4482421875, 30.6953125, 33.9423828125, 37.189453125, 40.4365234375, 43.68359375, 46.9306640625, 50.177734375, 53.4248046875, 56.671875, 59.9189453125, 63.166015625, 66.4130859375, 69.66015625, 72.9072265625, 76.154296875, 79.4013671875, 82.6484375, 85.8955078125, 89.142578125, 92.3896484375, 95.63671875, 98.8837890625, 102.130859375, 105.3779296875, 108.625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 6.0, 5.0, 19.0, 35.0, 60.0, 133.0, 267.0, 243.0, 98.0, 47.0, 27.0, 15.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.6875, -65.072265625, -62.45703125, -59.841796875, -57.2265625, -54.611328125, -51.99609375, -49.380859375, -46.765625, -44.150390625, -41.53515625, -38.919921875, -36.3046875, -33.689453125, -31.07421875, -28.458984375, -25.84375, -23.228515625, -20.61328125, -17.998046875, -15.3828125, -12.767578125, -10.15234375, -7.537109375, -4.921875, -2.306640625, 0.30859375, 2.923828125, 5.5390625, 8.154296875, 10.76953125, 13.384765625, 16.0, 18.615234375, 21.23046875, 23.845703125, 26.4609375, 29.076171875, 31.69140625, 34.306640625, 36.921875, 39.537109375, 42.15234375, 44.767578125, 47.3828125, 49.998046875, 52.61328125, 55.228515625, 57.84375, 60.458984375, 63.07421875, 65.689453125, 68.3046875, 70.919921875, 73.53515625, 76.150390625, 78.765625, 81.380859375, 83.99609375, 86.611328125, 89.2265625, 91.841796875, 94.45703125, 97.072265625, 99.6875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 5.0, 13.0, 9.0, 17.0, 18.0, 23.0, 30.0, 44.0, 65.0, 76.0, 80.0, 98.0, 89.0, 90.0, 88.0, 64.0, 48.0, 28.0, 19.0, 20.0, 17.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-592.8483276367188, -576.5643310546875, -560.2803955078125, -543.9963989257812, -527.7124633789062, -511.428466796875, -495.1445007324219, -478.86053466796875, -462.5765380859375, -446.2925720214844, -430.00860595703125, -413.724609375, -397.4406433105469, -381.15667724609375, -364.8727111816406, -348.5887451171875, -332.3047790527344, -316.02081298828125, -299.7368469238281, -283.452880859375, -267.16888427734375, -250.88491821289062, -234.6009521484375, -218.31698608398438, -202.0330047607422, -185.74903869628906, -169.46505737304688, -153.18109130859375, -136.89712524414062, -120.61314392089844, -104.32917785644531, -88.04520416259766, -71.76119995117188, -55.47722625732422, -39.19325637817383, -22.909286499023438, -6.625312805175781, 9.658660888671875, 25.942626953125, 42.226600646972656, 58.51057434082031, 74.79454803466797, 91.07852172851562, 107.36248779296875, 123.6464614868164, 139.93043518066406, 156.2144012451172, 172.49838256835938, 188.7823486328125, 205.06631469726562, 221.3502960205078, 237.63426208496094, 253.91824340820312, 270.20220947265625, 286.4861755371094, 302.7701416015625, 319.05413818359375, 335.3381042480469, 351.6220703125, 367.90606689453125, 384.1900329589844, 400.4739990234375, 416.7579650878906, 433.04193115234375, 449.3258972167969]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 5.0, 4.0, 7.0, 5.0, 13.0, 8.0, 8.0, 11.0, 15.0, 17.0, 25.0, 23.0, 27.0, 27.0, 29.0, 23.0, 35.0, 48.0, 27.0, 42.0, 48.0, 50.0, 37.0, 48.0, 32.0, 54.0, 38.0, 28.0, 30.0, 29.0, 17.0, 29.0, 24.0, 23.0, 9.0, 16.0, 15.0, 18.0, 11.0, 10.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-379.4832763671875, -368.2763671875, -357.0694274902344, -345.8625183105469, -334.6556091308594, -323.44866943359375, -312.24176025390625, -301.03485107421875, -289.82794189453125, -278.62103271484375, -267.4140930175781, -256.2071838378906, -245.00027465820312, -233.79335021972656, -222.58642578125, -211.3795166015625, -200.17257690429688, -188.9656524658203, -177.7587432861328, -166.55181884765625, -155.34490966796875, -144.1379852294922, -132.93106079101562, -121.7241439819336, -110.51722717285156, -99.31031036376953, -88.1033935546875, -76.89646911621094, -65.6895523071289, -54.482635498046875, -43.27571105957031, -32.06879425048828, -20.86187744140625, -9.654958724975586, 1.5519599914550781, 12.758880615234375, 23.965797424316406, 35.17271423339844, 46.379638671875, 57.58655548095703, 68.79347229003906, 80.0003890991211, 91.20730590820312, 102.41423034667969, 113.62114715576172, 124.82806396484375, 136.0349884033203, 147.24191284179688, 158.44882202148438, 169.65574645996094, 180.86265563964844, 192.069580078125, 203.2764892578125, 214.48341369628906, 225.69033813476562, 236.89724731445312, 248.1041717529297, 259.31109619140625, 270.51800537109375, 281.72491455078125, 292.9318542480469, 304.1387634277344, 315.345703125, 326.5526123046875, 337.759521484375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 8.0, 9.0, 11.0, 11.0, 12.0, 19.0, 38.0, 46.0, 59.0, 76.0, 165.0, 201.0, 338.0, 578.0, 979.0, 1901.0, 4742.0, 22472.0, 4143452.0, 11966.0, 3424.0, 1537.0, 823.0, 519.0, 281.0, 185.0, 123.0, 87.0, 58.0, 41.0, 22.0, 19.0, 15.0, 10.0, 7.0, 13.0, 3.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-204.5, -198.71484375, -192.9296875, -187.14453125, -181.359375, -175.57421875, -169.7890625, -164.00390625, -158.21875, -152.43359375, -146.6484375, -140.86328125, -135.078125, -129.29296875, -123.5078125, -117.72265625, -111.9375, -106.15234375, -100.3671875, -94.58203125, -88.796875, -83.01171875, -77.2265625, -71.44140625, -65.65625, -59.87109375, -54.0859375, -48.30078125, -42.515625, -36.73046875, -30.9453125, -25.16015625, -19.375, -13.58984375, -7.8046875, -2.01953125, 3.765625, 9.55078125, 15.3359375, 21.12109375, 26.90625, 32.69140625, 38.4765625, 44.26171875, 50.046875, 55.83203125, 61.6171875, 67.40234375, 73.1875, 78.97265625, 84.7578125, 90.54296875, 96.328125, 102.11328125, 107.8984375, 113.68359375, 119.46875, 125.25390625, 131.0390625, 136.82421875, 142.609375, 148.39453125, 154.1796875, 159.96484375, 165.75]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 3.0, 13.0, 16.0, 16.0, 21.0, 22.0, 30.0, 33.0, 34.0, 36.0, 39.0, 52.0, 51.0, 30.0, 53.0, 54.0, 47.0, 60.0, 43.0, 45.0, 37.0, 34.0, 27.0, 28.0, 24.0, 28.0, 25.0, 15.0, 15.0, 7.0, 14.0, 6.0, 11.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.421875, -16.885498046875, -16.34912109375, -15.812744140625, -15.2763671875, -14.739990234375, -14.20361328125, -13.667236328125, -13.130859375, -12.594482421875, -12.05810546875, -11.521728515625, -10.9853515625, -10.448974609375, -9.91259765625, -9.376220703125, -8.83984375, -8.303466796875, -7.76708984375, -7.230712890625, -6.6943359375, -6.157958984375, -5.62158203125, -5.085205078125, -4.548828125, -4.012451171875, -3.47607421875, -2.939697265625, -2.4033203125, -1.866943359375, -1.33056640625, -0.794189453125, -0.2578125, 0.278564453125, 0.81494140625, 1.351318359375, 1.8876953125, 2.424072265625, 2.96044921875, 3.496826171875, 4.033203125, 4.569580078125, 5.10595703125, 5.642333984375, 6.1787109375, 6.715087890625, 7.25146484375, 7.787841796875, 8.32421875, 8.860595703125, 9.39697265625, 9.933349609375, 10.4697265625, 11.006103515625, 11.54248046875, 12.078857421875, 12.615234375, 13.151611328125, 13.68798828125, 14.224365234375, 14.7607421875, 15.297119140625, 15.83349609375, 16.369873046875, 16.90625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 26.0, 28.0, 33.0, 60.0, 70.0, 102.0, 125.0, 171.0, 242.0, 310.0, 458.0, 800.0, 1671.0, 4978.0, 73170.0, 4100556.0, 6623.0, 2044.0, 863.0, 516.0, 348.0, 251.0, 224.0, 140.0, 112.0, 96.0, 60.0, 60.0, 34.0, 27.0, 24.0, 13.0, 10.0, 4.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-217.0, -207.9921875, -198.984375, -189.9765625, -180.96875, -171.9609375, -162.953125, -153.9453125, -144.9375, -135.9296875, -126.921875, -117.9140625, -108.90625, -99.8984375, -90.890625, -81.8828125, -72.875, -63.8671875, -54.859375, -45.8515625, -36.84375, -27.8359375, -18.828125, -9.8203125, -0.8125, 8.1953125, 17.203125, 26.2109375, 35.21875, 44.2265625, 53.234375, 62.2421875, 71.25, 80.2578125, 89.265625, 98.2734375, 107.28125, 116.2890625, 125.296875, 134.3046875, 143.3125, 152.3203125, 161.328125, 170.3359375, 179.34375, 188.3515625, 197.359375, 206.3671875, 215.375, 224.3828125, 233.390625, 242.3984375, 251.40625, 260.4140625, 269.421875, 278.4296875, 287.4375, 296.4453125, 305.453125, 314.4609375, 323.46875, 332.4765625, 341.484375, 350.4921875, 359.5]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 14.0, 46.0, 3904.0, 67.0, 17.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.1875, -35.67626953125, -34.1650390625, -32.65380859375, -31.142578125, -29.63134765625, -28.1201171875, -26.60888671875, -25.09765625, -23.58642578125, -22.0751953125, -20.56396484375, -19.052734375, -17.54150390625, -16.0302734375, -14.51904296875, -13.0078125, -11.49658203125, -9.9853515625, -8.47412109375, -6.962890625, -5.45166015625, -3.9404296875, -2.42919921875, -0.91796875, 0.59326171875, 2.1044921875, 3.61572265625, 5.126953125, 6.63818359375, 8.1494140625, 9.66064453125, 11.171875, 12.68310546875, 14.1943359375, 15.70556640625, 17.216796875, 18.72802734375, 20.2392578125, 21.75048828125, 23.26171875, 24.77294921875, 26.2841796875, 27.79541015625, 29.306640625, 30.81787109375, 32.3291015625, 33.84033203125, 35.3515625, 36.86279296875, 38.3740234375, 39.88525390625, 41.396484375, 42.90771484375, 44.4189453125, 45.93017578125, 47.44140625, 48.95263671875, 50.4638671875, 51.97509765625, 53.486328125, 54.99755859375, 56.5087890625, 58.02001953125, 59.53125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 13.0, 19.0, 42.0, 78.0, 149.0, 204.0, 179.0, 118.0, 65.0, 46.0, 24.0, 29.0, 10.0, 4.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.42698669433594, -235.44906616210938, -228.4711456298828, -221.49322509765625, -214.51528930664062, -207.53738403320312, -200.5594482421875, -193.58152770996094, -186.60360717773438, -179.6256866455078, -172.64776611328125, -165.6698455810547, -158.69192504882812, -151.7139892578125, -144.73606872558594, -137.75814819335938, -130.7802276611328, -123.80230712890625, -116.82438659667969, -109.8464584350586, -102.86853790283203, -95.89061737060547, -88.91268920898438, -81.93476867675781, -74.95684814453125, -67.97892761230469, -61.00100326538086, -54.02307891845703, -47.04515838623047, -40.067237854003906, -33.08931350708008, -26.11138916015625, -19.13348388671875, -12.155561447143555, -5.177639007568359, 1.800283432006836, 8.778205871582031, 15.756126403808594, 22.734050750732422, 29.71197509765625, 36.68989562988281, 43.667816162109375, 50.6457405090332, 57.62366485595703, 64.6015853881836, 71.57950592041016, 78.55743408203125, 85.53535461425781, 92.51327514648438, 99.49119567871094, 106.4691162109375, 113.4470443725586, 120.42496490478516, 127.40288543701172, 134.3808135986328, 141.35873413085938, 148.33665466308594, 155.3145751953125, 162.29249572753906, 169.27041625976562, 176.24835205078125, 183.22625732421875, 190.20419311523438, 197.18211364746094, 204.1600341796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 6.0, 9.0, 5.0, 12.0, 8.0, 8.0, 18.0, 16.0, 18.0, 21.0, 17.0, 22.0, 22.0, 28.0, 41.0, 37.0, 36.0, 33.0, 42.0, 31.0, 33.0, 36.0, 36.0, 25.0, 36.0, 28.0, 31.0, 29.0, 26.0, 27.0, 24.0, 28.0, 24.0, 22.0, 19.0, 15.0, 16.0, 27.0, 14.0, 13.0, 16.0, 5.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-63.00270080566406, -60.92894744873047, -58.855194091796875, -56.78144073486328, -54.70768737792969, -52.633934020996094, -50.5601806640625, -48.486427307128906, -46.41267395019531, -44.33892059326172, -42.265167236328125, -40.19141387939453, -38.11766052246094, -36.043907165527344, -33.97015380859375, -31.896400451660156, -29.822647094726562, -27.74889373779297, -25.675140380859375, -23.60138702392578, -21.527633666992188, -19.453880310058594, -17.380126953125, -15.306373596191406, -13.232620239257812, -11.158866882324219, -9.085113525390625, -7.011360168457031, -4.9376068115234375, -2.8638534545898438, -0.79010009765625, 1.2836532592773438, 3.3574066162109375, 5.431159973144531, 7.504913330078125, 9.578666687011719, 11.652420043945312, 13.726173400878906, 15.7999267578125, 17.873680114746094, 19.947433471679688, 22.02118682861328, 24.094940185546875, 26.16869354248047, 28.242446899414062, 30.316200256347656, 32.38995361328125, 34.463706970214844, 36.53746032714844, 38.61121368408203, 40.684967041015625, 42.75872039794922, 44.83247375488281, 46.906227111816406, 48.97998046875, 51.053733825683594, 53.12748718261719, 55.20124053955078, 57.274993896484375, 59.34874725341797, 61.42250061035156, 63.496253967285156, 65.57000732421875, 67.64376068115234, 69.71751403808594]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 10.0, 15.0, 29.0, 21.0, 29.0, 41.0, 65.0, 89.0, 108.0, 142.0, 201.0, 338.0, 427.0, 677.0, 954.0, 1601.0, 2399.0, 3761.0, 6436.0, 11525.0, 21453.0, 42702.0, 92380.0, 226267.0, 339518.0, 157975.0, 67463.0, 31586.0, 16665.0, 9002.0, 5279.0, 3232.0, 2043.0, 1310.0, 870.0, 574.0, 369.0, 318.0, 200.0, 135.0, 89.0, 66.0, 52.0, 29.0, 26.0, 16.0, 25.0, 14.0, 6.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-48.4375, -46.89013671875, -45.3427734375, -43.79541015625, -42.248046875, -40.70068359375, -39.1533203125, -37.60595703125, -36.05859375, -34.51123046875, -32.9638671875, -31.41650390625, -29.869140625, -28.32177734375, -26.7744140625, -25.22705078125, -23.6796875, -22.13232421875, -20.5849609375, -19.03759765625, -17.490234375, -15.94287109375, -14.3955078125, -12.84814453125, -11.30078125, -9.75341796875, -8.2060546875, -6.65869140625, -5.111328125, -3.56396484375, -2.0166015625, -0.46923828125, 1.078125, 2.62548828125, 4.1728515625, 5.72021484375, 7.267578125, 8.81494140625, 10.3623046875, 11.90966796875, 13.45703125, 15.00439453125, 16.5517578125, 18.09912109375, 19.646484375, 21.19384765625, 22.7412109375, 24.28857421875, 25.8359375, 27.38330078125, 28.9306640625, 30.47802734375, 32.025390625, 33.57275390625, 35.1201171875, 36.66748046875, 38.21484375, 39.76220703125, 41.3095703125, 42.85693359375, 44.404296875, 45.95166015625, 47.4990234375, 49.04638671875, 50.59375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 7.0, 13.0, 9.0, 7.0, 12.0, 22.0, 12.0, 21.0, 33.0, 34.0, 43.0, 44.0, 59.0, 53.0, 52.0, 50.0, 53.0, 53.0, 57.0, 35.0, 44.0, 34.0, 33.0, 32.0, 28.0, 19.0, 18.0, 18.0, 20.0, 25.0, 12.0, 4.0, 8.0, 8.0, 7.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.125, -20.435302734375, -19.74560546875, -19.055908203125, -18.3662109375, -17.676513671875, -16.98681640625, -16.297119140625, -15.607421875, -14.917724609375, -14.22802734375, -13.538330078125, -12.8486328125, -12.158935546875, -11.46923828125, -10.779541015625, -10.08984375, -9.400146484375, -8.71044921875, -8.020751953125, -7.3310546875, -6.641357421875, -5.95166015625, -5.261962890625, -4.572265625, -3.882568359375, -3.19287109375, -2.503173828125, -1.8134765625, -1.123779296875, -0.43408203125, 0.255615234375, 0.9453125, 1.635009765625, 2.32470703125, 3.014404296875, 3.7041015625, 4.393798828125, 5.08349609375, 5.773193359375, 6.462890625, 7.152587890625, 7.84228515625, 8.531982421875, 9.2216796875, 9.911376953125, 10.60107421875, 11.290771484375, 11.98046875, 12.670166015625, 13.35986328125, 14.049560546875, 14.7392578125, 15.428955078125, 16.11865234375, 16.808349609375, 17.498046875, 18.187744140625, 18.87744140625, 19.567138671875, 20.2568359375, 20.946533203125, 21.63623046875, 22.325927734375, 23.015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 10.0, 21.0, 10.0, 23.0, 32.0, 65.0, 83.0, 172.0, 321.0, 479.0, 1048.0, 2382.0, 5725.0, 15785.0, 57909.0, 360688.0, 500628.0, 72490.0, 18831.0, 6627.0, 2598.0, 1261.0, 584.0, 296.0, 181.0, 122.0, 53.0, 43.0, 23.0, 15.0, 19.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.3125, -90.8291015625, -87.345703125, -83.8623046875, -80.37890625, -76.8955078125, -73.412109375, -69.9287109375, -66.4453125, -62.9619140625, -59.478515625, -55.9951171875, -52.51171875, -49.0283203125, -45.544921875, -42.0615234375, -38.578125, -35.0947265625, -31.611328125, -28.1279296875, -24.64453125, -21.1611328125, -17.677734375, -14.1943359375, -10.7109375, -7.2275390625, -3.744140625, -0.2607421875, 3.22265625, 6.7060546875, 10.189453125, 13.6728515625, 17.15625, 20.6396484375, 24.123046875, 27.6064453125, 31.08984375, 34.5732421875, 38.056640625, 41.5400390625, 45.0234375, 48.5068359375, 51.990234375, 55.4736328125, 58.95703125, 62.4404296875, 65.923828125, 69.4072265625, 72.890625, 76.3740234375, 79.857421875, 83.3408203125, 86.82421875, 90.3076171875, 93.791015625, 97.2744140625, 100.7578125, 104.2412109375, 107.724609375, 111.2080078125, 114.69140625, 118.1748046875, 121.658203125, 125.1416015625, 128.625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 11.0, 19.0, 17.0, 25.0, 30.0, 21.0, 40.0, 47.0, 41.0, 37.0, 59.0, 60.0, 49.0, 45.0, 60.0, 69.0, 56.0, 53.0, 35.0, 39.0, 29.0, 41.0, 21.0, 15.0, 14.0, 9.0, 16.0, 7.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.375, -110.953125, -106.53125, -102.109375, -97.6875, -93.265625, -88.84375, -84.421875, -80.0, -75.578125, -71.15625, -66.734375, -62.3125, -57.890625, -53.46875, -49.046875, -44.625, -40.203125, -35.78125, -31.359375, -26.9375, -22.515625, -18.09375, -13.671875, -9.25, -4.828125, -0.40625, 4.015625, 8.4375, 12.859375, 17.28125, 21.703125, 26.125, 30.546875, 34.96875, 39.390625, 43.8125, 48.234375, 52.65625, 57.078125, 61.5, 65.921875, 70.34375, 74.765625, 79.1875, 83.609375, 88.03125, 92.453125, 96.875, 101.296875, 105.71875, 110.140625, 114.5625, 118.984375, 123.40625, 127.828125, 132.25, 136.671875, 141.09375, 145.515625, 149.9375, 154.359375, 158.78125, 163.203125, 167.625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 12.0, 19.0, 21.0, 32.0, 36.0, 60.0, 88.0, 135.0, 205.0, 317.0, 487.0, 760.0, 1308.0, 2339.0, 4898.0, 12149.0, 43821.0, 447540.0, 466531.0, 44751.0, 12244.0, 4868.0, 2347.0, 1378.0, 775.0, 442.0, 321.0, 173.0, 155.0, 108.0, 66.0, 42.0, 44.0, 19.0, 16.0, 13.0, 7.0, 4.0, 5.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.59375, -52.8330078125, -51.072265625, -49.3115234375, -47.55078125, -45.7900390625, -44.029296875, -42.2685546875, -40.5078125, -38.7470703125, -36.986328125, -35.2255859375, -33.46484375, -31.7041015625, -29.943359375, -28.1826171875, -26.421875, -24.6611328125, -22.900390625, -21.1396484375, -19.37890625, -17.6181640625, -15.857421875, -14.0966796875, -12.3359375, -10.5751953125, -8.814453125, -7.0537109375, -5.29296875, -3.5322265625, -1.771484375, -0.0107421875, 1.75, 3.5107421875, 5.271484375, 7.0322265625, 8.79296875, 10.5537109375, 12.314453125, 14.0751953125, 15.8359375, 17.5966796875, 19.357421875, 21.1181640625, 22.87890625, 24.6396484375, 26.400390625, 28.1611328125, 29.921875, 31.6826171875, 33.443359375, 35.2041015625, 36.96484375, 38.7255859375, 40.486328125, 42.2470703125, 44.0078125, 45.7685546875, 47.529296875, 49.2900390625, 51.05078125, 52.8115234375, 54.572265625, 56.3330078125, 58.09375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 15.0, 19.0, 19.0, 23.0, 34.0, 58.0, 78.0, 99.0, 131.0, 120.0, 108.0, 76.0, 51.0, 40.0, 25.0, 13.0, 26.0, 13.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01082611083984375, -0.01050722599029541, -0.01018834114074707, -0.00986945629119873, -0.00955057144165039, -0.00923168659210205, -0.008912801742553711, -0.008593916893005371, -0.008275032043457031, -0.007956147193908691, -0.0076372623443603516, -0.007318377494812012, -0.006999492645263672, -0.006680607795715332, -0.006361722946166992, -0.006042838096618652, -0.0057239532470703125, -0.005405068397521973, -0.005086183547973633, -0.004767298698425293, -0.004448413848876953, -0.004129528999328613, -0.0038106441497802734, -0.0034917593002319336, -0.0031728744506835938, -0.002853989601135254, -0.002535104751586914, -0.0022162199020385742, -0.0018973350524902344, -0.0015784502029418945, -0.0012595653533935547, -0.0009406805038452148, -0.000621795654296875, -0.00030291080474853516, 1.5974044799804688e-05, 0.00033485889434814453, 0.0006537437438964844, 0.0009726285934448242, 0.001291513442993164, 0.001610398292541504, 0.0019292831420898438, 0.0022481679916381836, 0.0025670528411865234, 0.0028859376907348633, 0.003204822540283203, 0.003523707389831543, 0.003842592239379883, 0.004161477088928223, 0.0044803619384765625, 0.004799246788024902, 0.005118131637573242, 0.005437016487121582, 0.005755901336669922, 0.006074786186218262, 0.0063936710357666016, 0.006712555885314941, 0.007031440734863281, 0.007350325584411621, 0.007669210433959961, 0.0079880952835083, 0.00830698013305664, 0.00862586498260498, 0.00894474983215332, 0.00926363468170166, 0.00958251953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 5.0, 6.0, 14.0, 15.0, 17.0, 38.0, 64.0, 101.0, 148.0, 348.0, 757.0, 1928.0, 7195.0, 44423.0, 837202.0, 137676.0, 13348.0, 3145.0, 1113.0, 454.0, 242.0, 100.0, 83.0, 42.0, 28.0, 21.0, 10.0, 9.0, 5.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.8125, -102.7626953125, -99.712890625, -96.6630859375, -93.61328125, -90.5634765625, -87.513671875, -84.4638671875, -81.4140625, -78.3642578125, -75.314453125, -72.2646484375, -69.21484375, -66.1650390625, -63.115234375, -60.0654296875, -57.015625, -53.9658203125, -50.916015625, -47.8662109375, -44.81640625, -41.7666015625, -38.716796875, -35.6669921875, -32.6171875, -29.5673828125, -26.517578125, -23.4677734375, -20.41796875, -17.3681640625, -14.318359375, -11.2685546875, -8.21875, -5.1689453125, -2.119140625, 0.9306640625, 3.98046875, 7.0302734375, 10.080078125, 13.1298828125, 16.1796875, 19.2294921875, 22.279296875, 25.3291015625, 28.37890625, 31.4287109375, 34.478515625, 37.5283203125, 40.578125, 43.6279296875, 46.677734375, 49.7275390625, 52.77734375, 55.8271484375, 58.876953125, 61.9267578125, 64.9765625, 68.0263671875, 71.076171875, 74.1259765625, 77.17578125, 80.2255859375, 83.275390625, 86.3251953125, 89.375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 11.0, 12.0, 16.0, 31.0, 51.0, 88.0, 141.0, 196.0, 171.0, 109.0, 57.0, 28.0, 23.0, 17.0, 9.0, 12.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-113.9375, -111.3330078125, -108.728515625, -106.1240234375, -103.51953125, -100.9150390625, -98.310546875, -95.7060546875, -93.1015625, -90.4970703125, -87.892578125, -85.2880859375, -82.68359375, -80.0791015625, -77.474609375, -74.8701171875, -72.265625, -69.6611328125, -67.056640625, -64.4521484375, -61.84765625, -59.2431640625, -56.638671875, -54.0341796875, -51.4296875, -48.8251953125, -46.220703125, -43.6162109375, -41.01171875, -38.4072265625, -35.802734375, -33.1982421875, -30.59375, -27.9892578125, -25.384765625, -22.7802734375, -20.17578125, -17.5712890625, -14.966796875, -12.3623046875, -9.7578125, -7.1533203125, -4.548828125, -1.9443359375, 0.66015625, 3.2646484375, 5.869140625, 8.4736328125, 11.078125, 13.6826171875, 16.287109375, 18.8916015625, 21.49609375, 24.1005859375, 26.705078125, 29.3095703125, 31.9140625, 34.5185546875, 37.123046875, 39.7275390625, 42.33203125, 44.9365234375, 47.541015625, 50.1455078125, 52.75]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 16.0, 21.0, 27.0, 49.0, 58.0, 83.0, 134.0, 152.0, 152.0, 110.0, 73.0, 56.0, 34.0, 13.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-520.7315063476562, -487.66729736328125, -454.60308837890625, -421.53887939453125, -388.47467041015625, -355.41046142578125, -322.3462829589844, -289.2820739746094, -256.2178649902344, -223.15365600585938, -190.08944702148438, -157.02525329589844, -123.96104431152344, -90.89683532714844, -57.8326416015625, -24.7684326171875, 8.2957763671875, 41.359981536865234, 74.42418670654297, 107.48838806152344, 140.55259704589844, 173.61680603027344, 206.68099975585938, 239.74520874023438, 272.8094177246094, 305.8736267089844, 338.9378356933594, 372.00201416015625, 405.06622314453125, 438.13043212890625, 471.19464111328125, 504.25885009765625, 537.322998046875, 570.38720703125, 603.451416015625, 636.515625, 669.579833984375, 702.64404296875, 735.708251953125, 768.7724609375, 801.836669921875, 834.90087890625, 867.965087890625, 901.029296875, 934.093505859375, 967.15771484375, 1000.221923828125, 1033.2861328125, 1066.350341796875, 1099.41455078125, 1132.478759765625, 1165.54296875, 1198.607177734375, 1231.67138671875, 1264.735595703125, 1297.7998046875, 1330.8638916015625, 1363.9281005859375, 1396.9923095703125, 1430.0565185546875, 1463.1207275390625, 1496.1849365234375, 1529.2491455078125, 1562.3133544921875, 1595.3775634765625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 1.0, 7.0, 6.0, 11.0, 12.0, 13.0, 13.0, 16.0, 22.0, 20.0, 18.0, 22.0, 22.0, 25.0, 33.0, 42.0, 33.0, 39.0, 33.0, 38.0, 56.0, 40.0, 45.0, 40.0, 33.0, 31.0, 32.0, 41.0, 27.0, 32.0, 20.0, 18.0, 21.0, 25.0, 22.0, 12.0, 11.0, 14.0, 7.0, 11.0, 10.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-495.1510009765625, -478.4688720703125, -461.7867431640625, -445.1046142578125, -428.4224853515625, -411.7403564453125, -395.0581970214844, -378.3760681152344, -361.6939392089844, -345.0118103027344, -328.3296813964844, -311.6475524902344, -294.96539306640625, -278.28326416015625, -261.60113525390625, -244.91900634765625, -228.23687744140625, -211.55474853515625, -194.87261962890625, -178.1904754638672, -161.5083465576172, -144.8262176513672, -128.14407348632812, -111.46194458007812, -94.77981567382812, -78.09768676757812, -61.415550231933594, -44.73341751098633, -28.051284790039062, -11.369155883789062, 5.312980651855469, 21.9951171875, 38.67718505859375, 55.359317779541016, 72.04145050048828, 88.72358703613281, 105.40571594238281, 122.08784484863281, 138.76998901367188, 155.45211791992188, 172.13424682617188, 188.81637573242188, 205.49850463867188, 222.18064880371094, 238.86277770996094, 255.54490661621094, 272.22705078125, 288.9091796875, 305.59130859375, 322.2734375, 338.95556640625, 355.6376953125, 372.31982421875, 389.001953125, 405.6841125488281, 422.3662414550781, 439.0483703613281, 455.7304992675781, 472.4126281738281, 489.0947570800781, 505.77691650390625, 522.4590454101562, 539.1411743164062, 555.8233032226562, 572.5054321289062]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 10.0, 16.0, 13.0, 32.0, 30.0, 74.0, 95.0, 128.0, 173.0, 250.0, 429.0, 611.0, 999.0, 1661.0, 3899.0, 27188.0, 4144708.0, 7958.0, 2359.0, 1242.0, 792.0, 535.0, 332.0, 260.0, 145.0, 95.0, 81.0, 55.0, 32.0, 23.0, 14.0, 8.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-259.5, -252.71484375, -245.9296875, -239.14453125, -232.359375, -225.57421875, -218.7890625, -212.00390625, -205.21875, -198.43359375, -191.6484375, -184.86328125, -178.078125, -171.29296875, -164.5078125, -157.72265625, -150.9375, -144.15234375, -137.3671875, -130.58203125, -123.796875, -117.01171875, -110.2265625, -103.44140625, -96.65625, -89.87109375, -83.0859375, -76.30078125, -69.515625, -62.73046875, -55.9453125, -49.16015625, -42.375, -35.58984375, -28.8046875, -22.01953125, -15.234375, -8.44921875, -1.6640625, 5.12109375, 11.90625, 18.69140625, 25.4765625, 32.26171875, 39.046875, 45.83203125, 52.6171875, 59.40234375, 66.1875, 72.97265625, 79.7578125, 86.54296875, 93.328125, 100.11328125, 106.8984375, 113.68359375, 120.46875, 127.25390625, 134.0390625, 140.82421875, 147.609375, 154.39453125, 161.1796875, 167.96484375, 174.75]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 5.0, 10.0, 15.0, 20.0, 25.0, 15.0, 26.0, 33.0, 39.0, 47.0, 44.0, 42.0, 54.0, 55.0, 56.0, 53.0, 57.0, 44.0, 43.0, 55.0, 42.0, 41.0, 31.0, 28.0, 28.0, 14.0, 16.0, 14.0, 13.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.772216796875, -19.99755859375, -19.222900390625, -18.4482421875, -17.673583984375, -16.89892578125, -16.124267578125, -15.349609375, -14.574951171875, -13.80029296875, -13.025634765625, -12.2509765625, -11.476318359375, -10.70166015625, -9.927001953125, -9.15234375, -8.377685546875, -7.60302734375, -6.828369140625, -6.0537109375, -5.279052734375, -4.50439453125, -3.729736328125, -2.955078125, -2.180419921875, -1.40576171875, -0.631103515625, 0.1435546875, 0.918212890625, 1.69287109375, 2.467529296875, 3.2421875, 4.016845703125, 4.79150390625, 5.566162109375, 6.3408203125, 7.115478515625, 7.89013671875, 8.664794921875, 9.439453125, 10.214111328125, 10.98876953125, 11.763427734375, 12.5380859375, 13.312744140625, 14.08740234375, 14.862060546875, 15.63671875, 16.411376953125, 17.18603515625, 17.960693359375, 18.7353515625, 19.510009765625, 20.28466796875, 21.059326171875, 21.833984375, 22.608642578125, 23.38330078125, 24.157958984375, 24.9326171875, 25.707275390625, 26.48193359375, 27.256591796875, 28.03125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 8.0, 9.0, 9.0, 15.0, 18.0, 22.0, 36.0, 45.0, 41.0, 85.0, 102.0, 172.0, 281.0, 551.0, 1349.0, 3994.0, 22458.0, 4147232.0, 12589.0, 2977.0, 1049.0, 433.0, 262.0, 151.0, 99.0, 68.0, 56.0, 49.0, 31.0, 21.0, 21.0, 10.0, 8.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-309.0, -300.01171875, -291.0234375, -282.03515625, -273.046875, -264.05859375, -255.0703125, -246.08203125, -237.09375, -228.10546875, -219.1171875, -210.12890625, -201.140625, -192.15234375, -183.1640625, -174.17578125, -165.1875, -156.19921875, -147.2109375, -138.22265625, -129.234375, -120.24609375, -111.2578125, -102.26953125, -93.28125, -84.29296875, -75.3046875, -66.31640625, -57.328125, -48.33984375, -39.3515625, -30.36328125, -21.375, -12.38671875, -3.3984375, 5.58984375, 14.578125, 23.56640625, 32.5546875, 41.54296875, 50.53125, 59.51953125, 68.5078125, 77.49609375, 86.484375, 95.47265625, 104.4609375, 113.44921875, 122.4375, 131.42578125, 140.4140625, 149.40234375, 158.390625, 167.37890625, 176.3671875, 185.35546875, 194.34375, 203.33203125, 212.3203125, 221.30859375, 230.296875, 239.28515625, 248.2734375, 257.26171875, 266.25]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 45.0, 3845.0, 123.0, 15.0, 12.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -73.22314453125, -71.3837890625, -69.54443359375, -67.705078125, -65.86572265625, -64.0263671875, -62.18701171875, -60.34765625, -58.50830078125, -56.6689453125, -54.82958984375, -52.990234375, -51.15087890625, -49.3115234375, -47.47216796875, -45.6328125, -43.79345703125, -41.9541015625, -40.11474609375, -38.275390625, -36.43603515625, -34.5966796875, -32.75732421875, -30.91796875, -29.07861328125, -27.2392578125, -25.39990234375, -23.560546875, -21.72119140625, -19.8818359375, -18.04248046875, -16.203125, -14.36376953125, -12.5244140625, -10.68505859375, -8.845703125, -7.00634765625, -5.1669921875, -3.32763671875, -1.48828125, 0.35107421875, 2.1904296875, 4.02978515625, 5.869140625, 7.70849609375, 9.5478515625, 11.38720703125, 13.2265625, 15.06591796875, 16.9052734375, 18.74462890625, 20.583984375, 22.42333984375, 24.2626953125, 26.10205078125, 27.94140625, 29.78076171875, 31.6201171875, 33.45947265625, 35.298828125, 37.13818359375, 38.9775390625, 40.81689453125, 42.65625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 7.0, 5.0, 5.0, 5.0, 6.0, 13.0, 14.0, 22.0, 23.0, 17.0, 42.0, 44.0, 59.0, 69.0, 78.0, 95.0, 96.0, 77.0, 72.0, 73.0, 48.0, 43.0, 22.0, 19.0, 10.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-117.26155090332031, -114.4413070678711, -111.62106323242188, -108.80081939697266, -105.98057556152344, -103.16033172607422, -100.340087890625, -97.51983642578125, -94.69960021972656, -91.87935638427734, -89.05911254882812, -86.2388687133789, -83.41862487792969, -80.59838104248047, -77.77813720703125, -74.9578857421875, -72.13764190673828, -69.31739807128906, -66.49715423583984, -63.676910400390625, -60.856666564941406, -58.03642272949219, -55.2161750793457, -52.395931243896484, -49.575687408447266, -46.75544357299805, -43.93519973754883, -41.114952087402344, -38.294708251953125, -35.474464416503906, -32.65422058105469, -29.83397674560547, -27.013736724853516, -24.193492889404297, -21.373249053955078, -18.553003311157227, -15.732759475708008, -12.912515640258789, -10.092269897460938, -7.272026062011719, -4.4517822265625, -1.631537914276123, 1.188706398010254, 4.008951187133789, 6.829195022583008, 9.649438858032227, 12.469684600830078, 15.289928436279297, 18.110172271728516, 20.930416107177734, 23.750659942626953, 26.570905685424805, 29.391149520874023, 32.211395263671875, 35.031639099121094, 37.85188293457031, 40.67212677001953, 43.49237060546875, 46.31261444091797, 49.13285827636719, 51.953102111816406, 54.773345947265625, 57.59359359741211, 60.41383743286133, 63.23408126831055]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 6.0, 8.0, 11.0, 14.0, 22.0, 14.0, 23.0, 31.0, 29.0, 37.0, 32.0, 39.0, 31.0, 44.0, 47.0, 56.0, 49.0, 53.0, 50.0, 45.0, 46.0, 38.0, 35.0, 46.0, 31.0, 30.0, 22.0, 8.0, 14.0, 16.0, 21.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-85.15863037109375, -82.89708709716797, -80.63554382324219, -78.3740005493164, -76.11245727539062, -73.85091400146484, -71.58937072753906, -69.32783508300781, -67.0662841796875, -64.80474090576172, -62.54319763183594, -60.281654357910156, -58.020111083984375, -55.758567810058594, -53.49702835083008, -51.2354850769043, -48.97394561767578, -46.71240234375, -44.45085906982422, -42.18931579589844, -39.927772521972656, -37.666229248046875, -35.40468978881836, -33.14314651489258, -30.881603240966797, -28.620059967041016, -26.358516693115234, -24.096975326538086, -21.835432052612305, -19.573888778686523, -17.312347412109375, -15.050804138183594, -12.789268493652344, -10.527725219726562, -8.266182899475098, -6.004640102386475, -3.7430973052978516, -1.4815540313720703, 0.7799882888793945, 3.0415306091308594, 5.303073883056641, 7.564616680145264, 9.826159477233887, 12.087701797485352, 14.349245071411133, 16.610788345336914, 18.872329711914062, 21.133872985839844, 23.395416259765625, 25.656959533691406, 27.918502807617188, 30.180044174194336, 32.44158935546875, 34.70313262939453, 36.96467208862305, 39.22621536254883, 41.48775863647461, 43.74930191040039, 46.01084518432617, 48.27238845825195, 50.53392791748047, 52.79547119140625, 55.05701446533203, 57.31855773925781, 59.580101013183594]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 11.0, 13.0, 11.0, 15.0, 42.0, 47.0, 72.0, 87.0, 138.0, 188.0, 281.0, 457.0, 721.0, 1123.0, 1815.0, 2907.0, 5179.0, 9397.0, 18051.0, 37886.0, 87937.0, 229442.0, 362427.0, 163511.0, 65109.0, 29188.0, 14100.0, 7503.0, 4252.0, 2509.0, 1451.0, 906.0, 597.0, 391.0, 263.0, 175.0, 112.0, 74.0, 48.0, 27.0, 22.0, 23.0, 13.0, 10.0, 14.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.34375, -53.7314453125, -52.119140625, -50.5068359375, -48.89453125, -47.2822265625, -45.669921875, -44.0576171875, -42.4453125, -40.8330078125, -39.220703125, -37.6083984375, -35.99609375, -34.3837890625, -32.771484375, -31.1591796875, -29.546875, -27.9345703125, -26.322265625, -24.7099609375, -23.09765625, -21.4853515625, -19.873046875, -18.2607421875, -16.6484375, -15.0361328125, -13.423828125, -11.8115234375, -10.19921875, -8.5869140625, -6.974609375, -5.3623046875, -3.75, -2.1376953125, -0.525390625, 1.0869140625, 2.69921875, 4.3115234375, 5.923828125, 7.5361328125, 9.1484375, 10.7607421875, 12.373046875, 13.9853515625, 15.59765625, 17.2099609375, 18.822265625, 20.4345703125, 22.046875, 23.6591796875, 25.271484375, 26.8837890625, 28.49609375, 30.1083984375, 31.720703125, 33.3330078125, 34.9453125, 36.5576171875, 38.169921875, 39.7822265625, 41.39453125, 43.0068359375, 44.619140625, 46.2314453125, 47.84375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 1.0, 8.0, 6.0, 12.0, 14.0, 9.0, 10.0, 17.0, 19.0, 26.0, 29.0, 45.0, 42.0, 52.0, 38.0, 44.0, 45.0, 57.0, 54.0, 64.0, 46.0, 39.0, 31.0, 52.0, 36.0, 32.0, 39.0, 35.0, 21.0, 14.0, 13.0, 12.0, 13.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.25, -25.45751953125, -24.6650390625, -23.87255859375, -23.080078125, -22.28759765625, -21.4951171875, -20.70263671875, -19.91015625, -19.11767578125, -18.3251953125, -17.53271484375, -16.740234375, -15.94775390625, -15.1552734375, -14.36279296875, -13.5703125, -12.77783203125, -11.9853515625, -11.19287109375, -10.400390625, -9.60791015625, -8.8154296875, -8.02294921875, -7.23046875, -6.43798828125, -5.6455078125, -4.85302734375, -4.060546875, -3.26806640625, -2.4755859375, -1.68310546875, -0.890625, -0.09814453125, 0.6943359375, 1.48681640625, 2.279296875, 3.07177734375, 3.8642578125, 4.65673828125, 5.44921875, 6.24169921875, 7.0341796875, 7.82666015625, 8.619140625, 9.41162109375, 10.2041015625, 10.99658203125, 11.7890625, 12.58154296875, 13.3740234375, 14.16650390625, 14.958984375, 15.75146484375, 16.5439453125, 17.33642578125, 18.12890625, 18.92138671875, 19.7138671875, 20.50634765625, 21.298828125, 22.09130859375, 22.8837890625, 23.67626953125, 24.46875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 9.0, 16.0, 14.0, 24.0, 44.0, 43.0, 75.0, 107.0, 172.0, 338.0, 609.0, 1128.0, 2532.0, 6139.0, 17477.0, 65167.0, 406382.0, 447755.0, 70184.0, 18651.0, 6380.0, 2559.0, 1233.0, 581.0, 316.0, 204.0, 119.0, 92.0, 42.0, 31.0, 28.0, 21.0, 15.0, 8.0, 3.0, 10.0, 4.0, 4.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.75, -95.84765625, -92.9453125, -90.04296875, -87.140625, -84.23828125, -81.3359375, -78.43359375, -75.53125, -72.62890625, -69.7265625, -66.82421875, -63.921875, -61.01953125, -58.1171875, -55.21484375, -52.3125, -49.41015625, -46.5078125, -43.60546875, -40.703125, -37.80078125, -34.8984375, -31.99609375, -29.09375, -26.19140625, -23.2890625, -20.38671875, -17.484375, -14.58203125, -11.6796875, -8.77734375, -5.875, -2.97265625, -0.0703125, 2.83203125, 5.734375, 8.63671875, 11.5390625, 14.44140625, 17.34375, 20.24609375, 23.1484375, 26.05078125, 28.953125, 31.85546875, 34.7578125, 37.66015625, 40.5625, 43.46484375, 46.3671875, 49.26953125, 52.171875, 55.07421875, 57.9765625, 60.87890625, 63.78125, 66.68359375, 69.5859375, 72.48828125, 75.390625, 78.29296875, 81.1953125, 84.09765625, 87.0]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 7.0, 12.0, 8.0, 11.0, 13.0, 11.0, 19.0, 22.0, 28.0, 29.0, 19.0, 30.0, 29.0, 40.0, 33.0, 41.0, 47.0, 51.0, 47.0, 44.0, 44.0, 38.0, 41.0, 40.0, 45.0, 32.0, 32.0, 35.0, 25.0, 27.0, 15.0, 10.0, 18.0, 11.0, 9.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.0, -90.6435546875, -87.287109375, -83.9306640625, -80.57421875, -77.2177734375, -73.861328125, -70.5048828125, -67.1484375, -63.7919921875, -60.435546875, -57.0791015625, -53.72265625, -50.3662109375, -47.009765625, -43.6533203125, -40.296875, -36.9404296875, -33.583984375, -30.2275390625, -26.87109375, -23.5146484375, -20.158203125, -16.8017578125, -13.4453125, -10.0888671875, -6.732421875, -3.3759765625, -0.01953125, 3.3369140625, 6.693359375, 10.0498046875, 13.40625, 16.7626953125, 20.119140625, 23.4755859375, 26.83203125, 30.1884765625, 33.544921875, 36.9013671875, 40.2578125, 43.6142578125, 46.970703125, 50.3271484375, 53.68359375, 57.0400390625, 60.396484375, 63.7529296875, 67.109375, 70.4658203125, 73.822265625, 77.1787109375, 80.53515625, 83.8916015625, 87.248046875, 90.6044921875, 93.9609375, 97.3173828125, 100.673828125, 104.0302734375, 107.38671875, 110.7431640625, 114.099609375, 117.4560546875, 120.8125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 13.0, 17.0, 32.0, 33.0, 60.0, 104.0, 189.0, 337.0, 693.0, 1532.0, 4421.0, 23280.0, 697940.0, 298463.0, 15371.0, 3467.0, 1261.0, 574.0, 317.0, 164.0, 90.0, 45.0, 50.0, 24.0, 27.0, 13.0, 8.0, 8.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.125, -70.40625, -67.6875, -64.96875, -62.25, -59.53125, -56.8125, -54.09375, -51.375, -48.65625, -45.9375, -43.21875, -40.5, -37.78125, -35.0625, -32.34375, -29.625, -26.90625, -24.1875, -21.46875, -18.75, -16.03125, -13.3125, -10.59375, -7.875, -5.15625, -2.4375, 0.28125, 3.0, 5.71875, 8.4375, 11.15625, 13.875, 16.59375, 19.3125, 22.03125, 24.75, 27.46875, 30.1875, 32.90625, 35.625, 38.34375, 41.0625, 43.78125, 46.5, 49.21875, 51.9375, 54.65625, 57.375, 60.09375, 62.8125, 65.53125, 68.25, 70.96875, 73.6875, 76.40625, 79.125, 81.84375, 84.5625, 87.28125, 90.0, 92.71875, 95.4375, 98.15625, 100.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 7.0, 6.0, 16.0, 22.0, 25.0, 61.0, 104.0, 192.0, 216.0, 159.0, 71.0, 37.0, 22.0, 14.0, 10.0, 9.0, 13.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0155792236328125, -0.014987468719482422, -0.014395713806152344, -0.013803958892822266, -0.013212203979492188, -0.01262044906616211, -0.012028694152832031, -0.011436939239501953, -0.010845184326171875, -0.010253429412841797, -0.009661674499511719, -0.00906991958618164, -0.008478164672851562, -0.007886409759521484, -0.007294654846191406, -0.006702899932861328, -0.00611114501953125, -0.005519390106201172, -0.004927635192871094, -0.004335880279541016, -0.0037441253662109375, -0.0031523704528808594, -0.0025606155395507812, -0.001968860626220703, -0.001377105712890625, -0.0007853507995605469, -0.00019359588623046875, 0.0003981590270996094, 0.0009899139404296875, 0.0015816688537597656, 0.0021734237670898438, 0.002765178680419922, 0.00335693359375, 0.003948688507080078, 0.004540443420410156, 0.005132198333740234, 0.0057239532470703125, 0.006315708160400391, 0.006907463073730469, 0.007499217987060547, 0.008090972900390625, 0.008682727813720703, 0.009274482727050781, 0.00986623764038086, 0.010457992553710938, 0.011049747467041016, 0.011641502380371094, 0.012233257293701172, 0.01282501220703125, 0.013416767120361328, 0.014008522033691406, 0.014600276947021484, 0.015192031860351562, 0.01578378677368164, 0.01637554168701172, 0.016967296600341797, 0.017559051513671875, 0.018150806427001953, 0.01874256134033203, 0.01933431625366211, 0.019926071166992188, 0.020517826080322266, 0.021109580993652344, 0.021701335906982422, 0.0222930908203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 17.0, 20.0, 42.0, 63.0, 92.0, 145.0, 195.0, 384.0, 813.0, 1713.0, 4588.0, 17902.0, 167810.0, 773531.0, 64947.0, 10360.0, 3176.0, 1266.0, 612.0, 300.0, 202.0, 109.0, 78.0, 48.0, 34.0, 20.0, 14.0, 13.0, 4.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-72.4375, -70.38671875, -68.3359375, -66.28515625, -64.234375, -62.18359375, -60.1328125, -58.08203125, -56.03125, -53.98046875, -51.9296875, -49.87890625, -47.828125, -45.77734375, -43.7265625, -41.67578125, -39.625, -37.57421875, -35.5234375, -33.47265625, -31.421875, -29.37109375, -27.3203125, -25.26953125, -23.21875, -21.16796875, -19.1171875, -17.06640625, -15.015625, -12.96484375, -10.9140625, -8.86328125, -6.8125, -4.76171875, -2.7109375, -0.66015625, 1.390625, 3.44140625, 5.4921875, 7.54296875, 9.59375, 11.64453125, 13.6953125, 15.74609375, 17.796875, 19.84765625, 21.8984375, 23.94921875, 26.0, 28.05078125, 30.1015625, 32.15234375, 34.203125, 36.25390625, 38.3046875, 40.35546875, 42.40625, 44.45703125, 46.5078125, 48.55859375, 50.609375, 52.66015625, 54.7109375, 56.76171875, 58.8125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 13.0, 31.0, 41.0, 54.0, 88.0, 120.0, 135.0, 143.0, 111.0, 87.0, 44.0, 31.0, 27.0, 15.0, 8.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.75, -62.94580078125, -61.1416015625, -59.33740234375, -57.533203125, -55.72900390625, -53.9248046875, -52.12060546875, -50.31640625, -48.51220703125, -46.7080078125, -44.90380859375, -43.099609375, -41.29541015625, -39.4912109375, -37.68701171875, -35.8828125, -34.07861328125, -32.2744140625, -30.47021484375, -28.666015625, -26.86181640625, -25.0576171875, -23.25341796875, -21.44921875, -19.64501953125, -17.8408203125, -16.03662109375, -14.232421875, -12.42822265625, -10.6240234375, -8.81982421875, -7.015625, -5.21142578125, -3.4072265625, -1.60302734375, 0.201171875, 2.00537109375, 3.8095703125, 5.61376953125, 7.41796875, 9.22216796875, 11.0263671875, 12.83056640625, 14.634765625, 16.43896484375, 18.2431640625, 20.04736328125, 21.8515625, 23.65576171875, 25.4599609375, 27.26416015625, 29.068359375, 30.87255859375, 32.6767578125, 34.48095703125, 36.28515625, 38.08935546875, 39.8935546875, 41.69775390625, 43.501953125, 45.30615234375, 47.1103515625, 48.91455078125, 50.71875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 10.0, 16.0, 15.0, 18.0, 36.0, 44.0, 43.0, 51.0, 98.0, 95.0, 101.0, 91.0, 92.0, 78.0, 63.0, 46.0, 34.0, 21.0, 13.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-396.11224365234375, -376.8864440917969, -357.66064453125, -338.4348449707031, -319.20904541015625, -299.9832763671875, -280.7574768066406, -261.53167724609375, -242.30587768554688, -223.080078125, -203.85427856445312, -184.6284942626953, -165.40269470214844, -146.17689514160156, -126.95110321044922, -107.72531127929688, -88.49951171875, -69.27371215820312, -50.04792022705078, -30.822124481201172, -11.596328735351562, 7.6294708251953125, 26.855262756347656, 46.0810546875, 65.30685424804688, 84.53265380859375, 103.7584457397461, 122.98423767089844, 142.2100372314453, 161.4358367919922, 180.66162109375, 199.88742065429688, 219.1131591796875, 238.33895874023438, 257.56475830078125, 276.7905578613281, 296.016357421875, 315.24212646484375, 334.4679260253906, 353.6937255859375, 372.9195251464844, 392.14532470703125, 411.3711242675781, 430.596923828125, 449.82269287109375, 469.04852294921875, 488.2742919921875, 507.5000915527344, 526.7258911132812, 545.95166015625, 565.177490234375, 584.4032592773438, 603.6290893554688, 622.8548583984375, 642.0806884765625, 661.3064575195312, 680.5322265625, 699.7579956054688, 718.9838256835938, 738.2095947265625, 757.4354248046875, 776.6611938476562, 795.8870239257812, 815.11279296875, 834.338623046875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 5.0, 8.0, 2.0, 9.0, 8.0, 10.0, 16.0, 12.0, 13.0, 29.0, 23.0, 20.0, 30.0, 29.0, 42.0, 54.0, 62.0, 55.0, 62.0, 63.0, 51.0, 41.0, 45.0, 37.0, 39.0, 32.0, 29.0, 33.0, 32.0, 18.0, 20.0, 21.0, 6.0, 10.0, 10.0, 11.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-692.869384765625, -673.8358764648438, -654.8023681640625, -635.7688598632812, -616.7353515625, -597.7017822265625, -578.6682739257812, -559.634765625, -540.6012573242188, -521.5677490234375, -502.53424072265625, -483.5007019042969, -464.4671936035156, -445.4336853027344, -426.400146484375, -407.36663818359375, -388.3331298828125, -369.29962158203125, -350.26611328125, -331.2325744628906, -312.1990661621094, -293.1655578613281, -274.13201904296875, -255.0985107421875, -236.06500244140625, -217.031494140625, -197.9979705810547, -178.96444702148438, -159.93093872070312, -140.89743041992188, -121.86390686035156, -102.83038330078125, -83.79693603515625, -64.76342010498047, -45.72990417480469, -26.696388244628906, -7.662872314453125, 11.370643615722656, 30.404159545898438, 49.43768310546875, 68.47119140625, 87.50470733642578, 106.53822326660156, 125.57173919677734, 144.60525512695312, 163.63876342773438, 182.6722869873047, 201.705810546875, 220.73931884765625, 239.7728271484375, 258.80633544921875, 277.8398742675781, 296.8733825683594, 315.9068908691406, 334.9404296875, 353.97393798828125, 373.0074462890625, 392.04095458984375, 411.074462890625, 430.1080017089844, 449.1415100097656, 468.1750183105469, 487.20855712890625, 506.2420654296875, 525.2755737304688]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 10.0, 5.0, 13.0, 15.0, 15.0, 35.0, 26.0, 41.0, 51.0, 76.0, 92.0, 143.0, 216.0, 303.0, 408.0, 613.0, 886.0, 1517.0, 3404.0, 4144988.0, 34143.0, 3026.0, 1384.0, 912.0, 586.0, 386.0, 272.0, 223.0, 139.0, 96.0, 64.0, 49.0, 46.0, 36.0, 21.0, 12.0, 8.0, 7.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.875, -201.564453125, -195.25390625, -188.943359375, -182.6328125, -176.322265625, -170.01171875, -163.701171875, -157.390625, -151.080078125, -144.76953125, -138.458984375, -132.1484375, -125.837890625, -119.52734375, -113.216796875, -106.90625, -100.595703125, -94.28515625, -87.974609375, -81.6640625, -75.353515625, -69.04296875, -62.732421875, -56.421875, -50.111328125, -43.80078125, -37.490234375, -31.1796875, -24.869140625, -18.55859375, -12.248046875, -5.9375, 0.373046875, 6.68359375, 12.994140625, 19.3046875, 25.615234375, 31.92578125, 38.236328125, 44.546875, 50.857421875, 57.16796875, 63.478515625, 69.7890625, 76.099609375, 82.41015625, 88.720703125, 95.03125, 101.341796875, 107.65234375, 113.962890625, 120.2734375, 126.583984375, 132.89453125, 139.205078125, 145.515625, 151.826171875, 158.13671875, 164.447265625, 170.7578125, 177.068359375, 183.37890625, 189.689453125, 196.0]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 7.0, 3.0, 8.0, 10.0, 6.0, 7.0, 12.0, 15.0, 16.0, 15.0, 19.0, 27.0, 26.0, 37.0, 55.0, 47.0, 43.0, 52.0, 49.0, 57.0, 58.0, 48.0, 59.0, 43.0, 44.0, 39.0, 29.0, 32.0, 26.0, 21.0, 21.0, 14.0, 12.0, 12.0, 8.0, 9.0, 2.0, 8.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.140625, -24.371337890625, -23.60205078125, -22.832763671875, -22.0634765625, -21.294189453125, -20.52490234375, -19.755615234375, -18.986328125, -18.217041015625, -17.44775390625, -16.678466796875, -15.9091796875, -15.139892578125, -14.37060546875, -13.601318359375, -12.83203125, -12.062744140625, -11.29345703125, -10.524169921875, -9.7548828125, -8.985595703125, -8.21630859375, -7.447021484375, -6.677734375, -5.908447265625, -5.13916015625, -4.369873046875, -3.6005859375, -2.831298828125, -2.06201171875, -1.292724609375, -0.5234375, 0.245849609375, 1.01513671875, 1.784423828125, 2.5537109375, 3.322998046875, 4.09228515625, 4.861572265625, 5.630859375, 6.400146484375, 7.16943359375, 7.938720703125, 8.7080078125, 9.477294921875, 10.24658203125, 11.015869140625, 11.78515625, 12.554443359375, 13.32373046875, 14.093017578125, 14.8623046875, 15.631591796875, 16.40087890625, 17.170166015625, 17.939453125, 18.708740234375, 19.47802734375, 20.247314453125, 21.0166015625, 21.785888671875, 22.55517578125, 23.324462890625, 24.09375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 15.0, 12.0, 22.0, 30.0, 34.0, 48.0, 69.0, 103.0, 154.0, 294.0, 551.0, 1736.0, 4138771.0, 49561.0, 1542.0, 545.0, 271.0, 161.0, 104.0, 76.0, 37.0, 33.0, 28.0, 19.0, 15.0, 7.0, 11.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-543.0, -522.859375, -502.71875, -482.578125, -462.4375, -442.296875, -422.15625, -402.015625, -381.875, -361.734375, -341.59375, -321.453125, -301.3125, -281.171875, -261.03125, -240.890625, -220.75, -200.609375, -180.46875, -160.328125, -140.1875, -120.046875, -99.90625, -79.765625, -59.625, -39.484375, -19.34375, 0.796875, 20.9375, 41.078125, 61.21875, 81.359375, 101.5, 121.640625, 141.78125, 161.921875, 182.0625, 202.203125, 222.34375, 242.484375, 262.625, 282.765625, 302.90625, 323.046875, 343.1875, 363.328125, 383.46875, 403.609375, 423.75, 443.890625, 464.03125, 484.171875, 504.3125, 524.453125, 544.59375, 564.734375, 584.875, 605.015625, 625.15625, 645.296875, 665.4375, 685.578125, 705.71875, 725.859375, 746.0]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 3915.0, 140.0, 11.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-147.125, -143.701171875, -140.27734375, -136.853515625, -133.4296875, -130.005859375, -126.58203125, -123.158203125, -119.734375, -116.310546875, -112.88671875, -109.462890625, -106.0390625, -102.615234375, -99.19140625, -95.767578125, -92.34375, -88.919921875, -85.49609375, -82.072265625, -78.6484375, -75.224609375, -71.80078125, -68.376953125, -64.953125, -61.529296875, -58.10546875, -54.681640625, -51.2578125, -47.833984375, -44.41015625, -40.986328125, -37.5625, -34.138671875, -30.71484375, -27.291015625, -23.8671875, -20.443359375, -17.01953125, -13.595703125, -10.171875, -6.748046875, -3.32421875, 0.099609375, 3.5234375, 6.947265625, 10.37109375, 13.794921875, 17.21875, 20.642578125, 24.06640625, 27.490234375, 30.9140625, 34.337890625, 37.76171875, 41.185546875, 44.609375, 48.033203125, 51.45703125, 54.880859375, 58.3046875, 61.728515625, 65.15234375, 68.576171875, 72.0]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 5.0, 6.0, 17.0, 19.0, 32.0, 48.0, 43.0, 86.0, 114.0, 133.0, 130.0, 99.0, 66.0, 48.0, 42.0, 22.0, 22.0, 10.0, 11.0, 8.0, 6.0, 10.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-222.56886291503906, -217.20550537109375, -211.84214782714844, -206.47879028320312, -201.1154327392578, -195.7520751953125, -190.38870239257812, -185.0253448486328, -179.6619873046875, -174.2986297607422, -168.93527221679688, -163.57191467285156, -158.20855712890625, -152.84518432617188, -147.48184204101562, -142.11846923828125, -136.755126953125, -131.3917694091797, -126.02841186523438, -120.66505432128906, -115.30168914794922, -109.9383316040039, -104.5749740600586, -99.21160888671875, -93.84825134277344, -88.48489379882812, -83.12153625488281, -77.7581787109375, -72.39481353759766, -67.03145599365234, -61.66809844970703, -56.30473709106445, -50.941368103027344, -45.57801055908203, -40.21464920043945, -34.85129165649414, -29.487932205200195, -24.12457275390625, -18.761215209960938, -13.39785385131836, -8.034496307373047, -2.6711373329162598, 2.6922216415405273, 8.055580139160156, 13.418939590454102, 18.782299041748047, 24.14565658569336, 29.509017944335938, 34.87237548828125, 40.23573303222656, 45.59909439086914, 50.96245193481445, 56.32581329345703, 61.689170837402344, 67.05252838134766, 72.4158935546875, 77.77925109863281, 83.14260864257812, 88.50596618652344, 93.86932373046875, 99.2326889038086, 104.5960464477539, 109.95940399169922, 115.32276916503906, 120.68611907958984]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 11.0, 8.0, 9.0, 13.0, 16.0, 18.0, 23.0, 26.0, 19.0, 41.0, 37.0, 38.0, 31.0, 42.0, 24.0, 45.0, 46.0, 45.0, 31.0, 43.0, 42.0, 41.0, 35.0, 42.0, 42.0, 35.0, 35.0, 21.0, 15.0, 25.0, 19.0, 14.0, 13.0, 6.0, 16.0, 9.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-97.53889465332031, -94.59437561035156, -91.64986419677734, -88.70535278320312, -85.76083374023438, -82.81631469726562, -79.8718032836914, -76.92729187011719, -73.98277282714844, -71.03825378417969, -68.09374237060547, -65.14923095703125, -62.2047119140625, -59.260196685791016, -56.31568145751953, -53.37116622924805, -50.42665100097656, -47.48213577270508, -44.537620544433594, -41.59310531616211, -38.648590087890625, -35.70407485961914, -32.759559631347656, -29.815044403076172, -26.870529174804688, -23.926013946533203, -20.98149871826172, -18.036983489990234, -15.09246826171875, -12.147953033447266, -9.203437805175781, -6.258922576904297, -3.3144149780273438, -0.3698997497558594, 2.574615478515625, 5.519130706787109, 8.463645935058594, 11.408161163330078, 14.352676391601562, 17.297191619873047, 20.24170684814453, 23.186222076416016, 26.1307373046875, 29.075252532958984, 32.01976776123047, 34.96428298950195, 37.90879821777344, 40.85331344604492, 43.797828674316406, 46.74234390258789, 49.686859130859375, 52.63137435913086, 55.575889587402344, 58.52040481567383, 61.46492004394531, 64.40943908691406, 67.35395050048828, 70.2984619140625, 73.24298095703125, 76.1875, 79.13201141357422, 82.07652282714844, 85.02104187011719, 87.96556091308594, 90.91007232666016]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 8.0, 8.0, 13.0, 12.0, 29.0, 36.0, 40.0, 83.0, 120.0, 168.0, 260.0, 455.0, 656.0, 1120.0, 1944.0, 3521.0, 7036.0, 14993.0, 36168.0, 104460.0, 436203.0, 308132.0, 78669.0, 28624.0, 12394.0, 5929.0, 3082.0, 1730.0, 1012.0, 581.0, 370.0, 228.0, 148.0, 119.0, 75.0, 41.0, 25.0, 16.0, 12.0, 13.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.6875, -67.2744140625, -64.861328125, -62.4482421875, -60.03515625, -57.6220703125, -55.208984375, -52.7958984375, -50.3828125, -47.9697265625, -45.556640625, -43.1435546875, -40.73046875, -38.3173828125, -35.904296875, -33.4912109375, -31.078125, -28.6650390625, -26.251953125, -23.8388671875, -21.42578125, -19.0126953125, -16.599609375, -14.1865234375, -11.7734375, -9.3603515625, -6.947265625, -4.5341796875, -2.12109375, 0.2919921875, 2.705078125, 5.1181640625, 7.53125, 9.9443359375, 12.357421875, 14.7705078125, 17.18359375, 19.5966796875, 22.009765625, 24.4228515625, 26.8359375, 29.2490234375, 31.662109375, 34.0751953125, 36.48828125, 38.9013671875, 41.314453125, 43.7275390625, 46.140625, 48.5537109375, 50.966796875, 53.3798828125, 55.79296875, 58.2060546875, 60.619140625, 63.0322265625, 65.4453125, 67.8583984375, 70.271484375, 72.6845703125, 75.09765625, 77.5107421875, 79.923828125, 82.3369140625, 84.75]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 5.0, 15.0, 13.0, 22.0, 18.0, 28.0, 22.0, 26.0, 32.0, 47.0, 47.0, 39.0, 46.0, 59.0, 49.0, 60.0, 67.0, 54.0, 39.0, 52.0, 24.0, 32.0, 38.0, 21.0, 26.0, 10.0, 21.0, 16.0, 15.0, 5.0, 7.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.68994140625, -28.6923828125, -27.69482421875, -26.697265625, -25.69970703125, -24.7021484375, -23.70458984375, -22.70703125, -21.70947265625, -20.7119140625, -19.71435546875, -18.716796875, -17.71923828125, -16.7216796875, -15.72412109375, -14.7265625, -13.72900390625, -12.7314453125, -11.73388671875, -10.736328125, -9.73876953125, -8.7412109375, -7.74365234375, -6.74609375, -5.74853515625, -4.7509765625, -3.75341796875, -2.755859375, -1.75830078125, -0.7607421875, 0.23681640625, 1.234375, 2.23193359375, 3.2294921875, 4.22705078125, 5.224609375, 6.22216796875, 7.2197265625, 8.21728515625, 9.21484375, 10.21240234375, 11.2099609375, 12.20751953125, 13.205078125, 14.20263671875, 15.2001953125, 16.19775390625, 17.1953125, 18.19287109375, 19.1904296875, 20.18798828125, 21.185546875, 22.18310546875, 23.1806640625, 24.17822265625, 25.17578125, 26.17333984375, 27.1708984375, 28.16845703125, 29.166015625, 30.16357421875, 31.1611328125, 32.15869140625, 33.15625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 13.0, 12.0, 17.0, 25.0, 29.0, 37.0, 62.0, 89.0, 155.0, 264.0, 549.0, 926.0, 1937.0, 4807.0, 15551.0, 73487.0, 655937.0, 245219.0, 34374.0, 8898.0, 3110.0, 1382.0, 672.0, 351.0, 225.0, 134.0, 89.0, 60.0, 35.0, 24.0, 21.0, 19.0, 11.0, 3.0, 4.0, 7.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.875, -112.4443359375, -109.013671875, -105.5830078125, -102.15234375, -98.7216796875, -95.291015625, -91.8603515625, -88.4296875, -84.9990234375, -81.568359375, -78.1376953125, -74.70703125, -71.2763671875, -67.845703125, -64.4150390625, -60.984375, -57.5537109375, -54.123046875, -50.6923828125, -47.26171875, -43.8310546875, -40.400390625, -36.9697265625, -33.5390625, -30.1083984375, -26.677734375, -23.2470703125, -19.81640625, -16.3857421875, -12.955078125, -9.5244140625, -6.09375, -2.6630859375, 0.767578125, 4.1982421875, 7.62890625, 11.0595703125, 14.490234375, 17.9208984375, 21.3515625, 24.7822265625, 28.212890625, 31.6435546875, 35.07421875, 38.5048828125, 41.935546875, 45.3662109375, 48.796875, 52.2275390625, 55.658203125, 59.0888671875, 62.51953125, 65.9501953125, 69.380859375, 72.8115234375, 76.2421875, 79.6728515625, 83.103515625, 86.5341796875, 89.96484375, 93.3955078125, 96.826171875, 100.2568359375, 103.6875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 7.0, 1.0, 12.0, 15.0, 16.0, 12.0, 20.0, 28.0, 29.0, 35.0, 28.0, 32.0, 37.0, 36.0, 36.0, 45.0, 42.0, 46.0, 43.0, 39.0, 46.0, 41.0, 42.0, 35.0, 32.0, 45.0, 27.0, 25.0, 16.0, 20.0, 18.0, 12.0, 14.0, 14.0, 10.0, 6.0, 6.0, 1.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.5625, -110.857421875, -107.15234375, -103.447265625, -99.7421875, -96.037109375, -92.33203125, -88.626953125, -84.921875, -81.216796875, -77.51171875, -73.806640625, -70.1015625, -66.396484375, -62.69140625, -58.986328125, -55.28125, -51.576171875, -47.87109375, -44.166015625, -40.4609375, -36.755859375, -33.05078125, -29.345703125, -25.640625, -21.935546875, -18.23046875, -14.525390625, -10.8203125, -7.115234375, -3.41015625, 0.294921875, 4.0, 7.705078125, 11.41015625, 15.115234375, 18.8203125, 22.525390625, 26.23046875, 29.935546875, 33.640625, 37.345703125, 41.05078125, 44.755859375, 48.4609375, 52.166015625, 55.87109375, 59.576171875, 63.28125, 66.986328125, 70.69140625, 74.396484375, 78.1015625, 81.806640625, 85.51171875, 89.216796875, 92.921875, 96.626953125, 100.33203125, 104.037109375, 107.7421875, 111.447265625, 115.15234375, 118.857421875, 122.5625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 7.0, 7.0, 12.0, 13.0, 26.0, 17.0, 29.0, 59.0, 93.0, 225.0, 418.0, 1028.0, 2686.0, 9029.0, 46864.0, 627948.0, 318052.0, 31470.0, 6813.0, 2169.0, 768.0, 346.0, 183.0, 96.0, 62.0, 39.0, 27.0, 21.0, 12.0, 11.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.96875, -61.1640625, -59.359375, -57.5546875, -55.75, -53.9453125, -52.140625, -50.3359375, -48.53125, -46.7265625, -44.921875, -43.1171875, -41.3125, -39.5078125, -37.703125, -35.8984375, -34.09375, -32.2890625, -30.484375, -28.6796875, -26.875, -25.0703125, -23.265625, -21.4609375, -19.65625, -17.8515625, -16.046875, -14.2421875, -12.4375, -10.6328125, -8.828125, -7.0234375, -5.21875, -3.4140625, -1.609375, 0.1953125, 2.0, 3.8046875, 5.609375, 7.4140625, 9.21875, 11.0234375, 12.828125, 14.6328125, 16.4375, 18.2421875, 20.046875, 21.8515625, 23.65625, 25.4609375, 27.265625, 29.0703125, 30.875, 32.6796875, 34.484375, 36.2890625, 38.09375, 39.8984375, 41.703125, 43.5078125, 45.3125, 47.1171875, 48.921875, 50.7265625, 52.53125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 3.0, 4.0, 9.0, 8.0, 21.0, 21.0, 52.0, 102.0, 161.0, 224.0, 168.0, 101.0, 43.0, 28.0, 17.0, 16.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008453369140625, -0.007940053939819336, -0.007426738739013672, -0.006913423538208008, -0.006400108337402344, -0.00588679313659668, -0.005373477935791016, -0.0048601627349853516, -0.0043468475341796875, -0.0038335323333740234, -0.0033202171325683594, -0.0028069019317626953, -0.0022935867309570312, -0.0017802715301513672, -0.0012669563293457031, -0.0007536411285400391, -0.000240325927734375, 0.00027298927307128906, 0.0007863044738769531, 0.0012996196746826172, 0.0018129348754882812, 0.0023262500762939453, 0.0028395652770996094, 0.0033528804779052734, 0.0038661956787109375, 0.0043795108795166016, 0.004892826080322266, 0.00540614128112793, 0.005919456481933594, 0.006432771682739258, 0.006946086883544922, 0.007459402084350586, 0.00797271728515625, 0.008486032485961914, 0.008999347686767578, 0.009512662887573242, 0.010025978088378906, 0.01053929328918457, 0.011052608489990234, 0.011565923690795898, 0.012079238891601562, 0.012592554092407227, 0.01310586929321289, 0.013619184494018555, 0.014132499694824219, 0.014645814895629883, 0.015159130096435547, 0.01567244529724121, 0.016185760498046875, 0.01669907569885254, 0.017212390899658203, 0.017725706100463867, 0.01823902130126953, 0.018752336502075195, 0.01926565170288086, 0.019778966903686523, 0.020292282104492188, 0.02080559730529785, 0.021318912506103516, 0.02183222770690918, 0.022345542907714844, 0.022858858108520508, 0.023372173309326172, 0.023885488510131836, 0.0243988037109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 7.0, 11.0, 7.0, 16.0, 23.0, 30.0, 41.0, 57.0, 85.0, 171.0, 277.0, 595.0, 1451.0, 4780.0, 22783.0, 224477.0, 723785.0, 56615.0, 9112.0, 2385.0, 853.0, 413.0, 210.0, 116.0, 65.0, 56.0, 31.0, 34.0, 20.0, 14.0, 9.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.5625, -72.318359375, -70.07421875, -67.830078125, -65.5859375, -63.341796875, -61.09765625, -58.853515625, -56.609375, -54.365234375, -52.12109375, -49.876953125, -47.6328125, -45.388671875, -43.14453125, -40.900390625, -38.65625, -36.412109375, -34.16796875, -31.923828125, -29.6796875, -27.435546875, -25.19140625, -22.947265625, -20.703125, -18.458984375, -16.21484375, -13.970703125, -11.7265625, -9.482421875, -7.23828125, -4.994140625, -2.75, -0.505859375, 1.73828125, 3.982421875, 6.2265625, 8.470703125, 10.71484375, 12.958984375, 15.203125, 17.447265625, 19.69140625, 21.935546875, 24.1796875, 26.423828125, 28.66796875, 30.912109375, 33.15625, 35.400390625, 37.64453125, 39.888671875, 42.1328125, 44.376953125, 46.62109375, 48.865234375, 51.109375, 53.353515625, 55.59765625, 57.841796875, 60.0859375, 62.330078125, 64.57421875, 66.818359375, 69.0625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 12.0, 8.0, 12.0, 28.0, 31.0, 49.0, 58.0, 76.0, 124.0, 175.0, 138.0, 82.0, 69.0, 36.0, 34.0, 21.0, 17.0, 12.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84375, -50.58740234375, -48.3310546875, -46.07470703125, -43.818359375, -41.56201171875, -39.3056640625, -37.04931640625, -34.79296875, -32.53662109375, -30.2802734375, -28.02392578125, -25.767578125, -23.51123046875, -21.2548828125, -18.99853515625, -16.7421875, -14.48583984375, -12.2294921875, -9.97314453125, -7.716796875, -5.46044921875, -3.2041015625, -0.94775390625, 1.30859375, 3.56494140625, 5.8212890625, 8.07763671875, 10.333984375, 12.59033203125, 14.8466796875, 17.10302734375, 19.359375, 21.61572265625, 23.8720703125, 26.12841796875, 28.384765625, 30.64111328125, 32.8974609375, 35.15380859375, 37.41015625, 39.66650390625, 41.9228515625, 44.17919921875, 46.435546875, 48.69189453125, 50.9482421875, 53.20458984375, 55.4609375, 57.71728515625, 59.9736328125, 62.22998046875, 64.486328125, 66.74267578125, 68.9990234375, 71.25537109375, 73.51171875, 75.76806640625, 78.0244140625, 80.28076171875, 82.537109375, 84.79345703125, 87.0498046875, 89.30615234375, 91.5625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 17.0, 18.0, 64.0, 118.0, 210.0, 243.0, 153.0, 82.0, 43.0, 20.0, 11.0, 9.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-997.660888671875, -950.6033935546875, -903.5459594726562, -856.488525390625, -809.4310302734375, -762.37353515625, -715.3161010742188, -668.2586669921875, -621.201171875, -574.1436767578125, -527.0862426757812, -480.0287780761719, -432.9713134765625, -385.9138488769531, -338.85638427734375, -291.7989196777344, -244.741455078125, -197.68399047851562, -150.62652587890625, -103.56906127929688, -56.5115966796875, -9.454132080078125, 37.60333251953125, 84.66079711914062, 131.71826171875, 178.77572631835938, 225.83319091796875, 272.8906555175781, 319.9481201171875, 367.0055847167969, 414.06304931640625, 461.1205139160156, 508.177978515625, 555.2354736328125, 602.2929077148438, 649.350341796875, 696.4078369140625, 743.46533203125, 790.5227661132812, 837.5802001953125, 884.6376953125, 931.6951904296875, 978.7526245117188, 1025.81005859375, 1072.8675537109375, 1119.925048828125, 1166.982421875, 1214.0399169921875, 1261.097412109375, 1308.1549072265625, 1355.21240234375, 1402.269775390625, 1449.3272705078125, 1496.384765625, 1543.442138671875, 1590.4996337890625, 1637.55712890625, 1684.6146240234375, 1731.672119140625, 1778.7294921875, 1825.7869873046875, 1872.844482421875, 1919.90185546875, 1966.9593505859375, 2014.016845703125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 9.0, 5.0, 11.0, 17.0, 16.0, 16.0, 22.0, 29.0, 46.0, 38.0, 35.0, 51.0, 54.0, 55.0, 74.0, 53.0, 57.0, 51.0, 51.0, 51.0, 35.0, 41.0, 30.0, 28.0, 19.0, 14.0, 17.0, 14.0, 15.0, 12.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-650.7698364257812, -627.1006469726562, -603.4314575195312, -579.76220703125, -556.093017578125, -532.423828125, -508.754638671875, -485.08544921875, -461.416259765625, -437.7470703125, -414.0778503417969, -390.4086608886719, -366.7394714355469, -343.07025146484375, -319.40106201171875, -295.73187255859375, -272.0626525878906, -248.39344787597656, -224.72425842285156, -201.0550537109375, -177.3858642578125, -153.71665954589844, -130.04745483398438, -106.37826538085938, -82.70906066894531, -59.03986358642578, -35.370662689208984, -11.701461791992188, 11.967735290527344, 35.636932373046875, 59.30613708496094, 82.97532653808594, 106.64453125, 130.31373596191406, 153.98292541503906, 177.65213012695312, 201.32131958007812, 224.9905242919922, 248.65972900390625, 272.32891845703125, 295.99810791015625, 319.66729736328125, 343.3365173339844, 367.0057067871094, 390.6748962402344, 414.3441162109375, 438.0133056640625, 461.6824951171875, 485.3517150878906, 509.0209045410156, 532.6901245117188, 556.3593139648438, 580.0285034179688, 603.6976928710938, 627.366943359375, 651.0361328125, 674.705322265625, 698.37451171875, 722.043701171875, 745.712890625, 769.3821411132812, 793.0513305664062, 816.7205200195312, 840.3897094726562, 864.0588989257812]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 7.0, 1.0, 9.0, 9.0, 18.0, 14.0, 21.0, 30.0, 48.0, 62.0, 99.0, 123.0, 166.0, 310.0, 427.0, 631.0, 984.0, 1486.0, 2689.0, 5530.0, 23555.0, 4129707.0, 17038.0, 4707.0, 2421.0, 1419.0, 900.0, 601.0, 392.0, 276.0, 176.0, 131.0, 93.0, 50.0, 47.0, 37.0, 22.0, 18.0, 12.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.875, -151.71875, -146.5625, -141.40625, -136.25, -131.09375, -125.9375, -120.78125, -115.625, -110.46875, -105.3125, -100.15625, -95.0, -89.84375, -84.6875, -79.53125, -74.375, -69.21875, -64.0625, -58.90625, -53.75, -48.59375, -43.4375, -38.28125, -33.125, -27.96875, -22.8125, -17.65625, -12.5, -7.34375, -2.1875, 2.96875, 8.125, 13.28125, 18.4375, 23.59375, 28.75, 33.90625, 39.0625, 44.21875, 49.375, 54.53125, 59.6875, 64.84375, 70.0, 75.15625, 80.3125, 85.46875, 90.625, 95.78125, 100.9375, 106.09375, 111.25, 116.40625, 121.5625, 126.71875, 131.875, 137.03125, 142.1875, 147.34375, 152.5, 157.65625, 162.8125, 167.96875, 173.125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 7.0, 14.0, 28.0, 28.0, 23.0, 38.0, 56.0, 65.0, 60.0, 73.0, 69.0, 82.0, 84.0, 63.0, 65.0, 59.0, 33.0, 38.0, 21.0, 13.0, 12.0, 16.0, 14.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-50.84375, -49.47705078125, -48.1103515625, -46.74365234375, -45.376953125, -44.01025390625, -42.6435546875, -41.27685546875, -39.91015625, -38.54345703125, -37.1767578125, -35.81005859375, -34.443359375, -33.07666015625, -31.7099609375, -30.34326171875, -28.9765625, -27.60986328125, -26.2431640625, -24.87646484375, -23.509765625, -22.14306640625, -20.7763671875, -19.40966796875, -18.04296875, -16.67626953125, -15.3095703125, -13.94287109375, -12.576171875, -11.20947265625, -9.8427734375, -8.47607421875, -7.109375, -5.74267578125, -4.3759765625, -3.00927734375, -1.642578125, -0.27587890625, 1.0908203125, 2.45751953125, 3.82421875, 5.19091796875, 6.5576171875, 7.92431640625, 9.291015625, 10.65771484375, 12.0244140625, 13.39111328125, 14.7578125, 16.12451171875, 17.4912109375, 18.85791015625, 20.224609375, 21.59130859375, 22.9580078125, 24.32470703125, 25.69140625, 27.05810546875, 28.4248046875, 29.79150390625, 31.158203125, 32.52490234375, 33.8916015625, 35.25830078125, 36.625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 19.0, 13.0, 25.0, 39.0, 49.0, 62.0, 136.0, 160.0, 237.0, 348.0, 527.0, 973.0, 1594.0, 3073.0, 7426.0, 42505.0, 4103301.0, 21736.0, 5681.0, 2643.0, 1387.0, 791.0, 500.0, 303.0, 239.0, 153.0, 105.0, 84.0, 48.0, 29.0, 32.0, 21.0, 8.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-204.75, -198.79296875, -192.8359375, -186.87890625, -180.921875, -174.96484375, -169.0078125, -163.05078125, -157.09375, -151.13671875, -145.1796875, -139.22265625, -133.265625, -127.30859375, -121.3515625, -115.39453125, -109.4375, -103.48046875, -97.5234375, -91.56640625, -85.609375, -79.65234375, -73.6953125, -67.73828125, -61.78125, -55.82421875, -49.8671875, -43.91015625, -37.953125, -31.99609375, -26.0390625, -20.08203125, -14.125, -8.16796875, -2.2109375, 3.74609375, 9.703125, 15.66015625, 21.6171875, 27.57421875, 33.53125, 39.48828125, 45.4453125, 51.40234375, 57.359375, 63.31640625, 69.2734375, 75.23046875, 81.1875, 87.14453125, 93.1015625, 99.05859375, 105.015625, 110.97265625, 116.9296875, 122.88671875, 128.84375, 134.80078125, 140.7578125, 146.71484375, 152.671875, 158.62890625, 164.5859375, 170.54296875, 176.5]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 8.0, 9.0, 17.0, 16.0, 45.0, 167.0, 3643.0, 101.0, 24.0, 15.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.9375, -59.7529296875, -57.568359375, -55.3837890625, -53.19921875, -51.0146484375, -48.830078125, -46.6455078125, -44.4609375, -42.2763671875, -40.091796875, -37.9072265625, -35.72265625, -33.5380859375, -31.353515625, -29.1689453125, -26.984375, -24.7998046875, -22.615234375, -20.4306640625, -18.24609375, -16.0615234375, -13.876953125, -11.6923828125, -9.5078125, -7.3232421875, -5.138671875, -2.9541015625, -0.76953125, 1.4150390625, 3.599609375, 5.7841796875, 7.96875, 10.1533203125, 12.337890625, 14.5224609375, 16.70703125, 18.8916015625, 21.076171875, 23.2607421875, 25.4453125, 27.6298828125, 29.814453125, 31.9990234375, 34.18359375, 36.3681640625, 38.552734375, 40.7373046875, 42.921875, 45.1064453125, 47.291015625, 49.4755859375, 51.66015625, 53.8447265625, 56.029296875, 58.2138671875, 60.3984375, 62.5830078125, 64.767578125, 66.9521484375, 69.13671875, 71.3212890625, 73.505859375, 75.6904296875, 77.875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 16.0, 20.0, 39.0, 63.0, 92.0, 139.0, 163.0, 148.0, 98.0, 77.0, 39.0, 22.0, 17.0, 11.0, 9.0, 4.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.9148712158203, -219.68553161621094, -211.45620727539062, -203.22686767578125, -194.99752807617188, -186.7681884765625, -178.5388641357422, -170.3095245361328, -162.0802001953125, -153.85086059570312, -145.6215362548828, -137.39219665527344, -129.16285705566406, -120.93352508544922, -112.70419311523438, -104.474853515625, -96.24551391601562, -88.01618194580078, -79.7868423461914, -71.55751037597656, -63.32817459106445, -55.098838806152344, -46.8695068359375, -38.64017105102539, -30.41083526611328, -22.181499481201172, -13.952165603637695, -5.722831726074219, 2.5065040588378906, 10.73583984375, 18.965171813964844, 27.194507598876953, 35.423858642578125, 43.653194427490234, 51.882530212402344, 60.11186218261719, 68.34120178222656, 76.5705337524414, 84.79986572265625, 93.02920532226562, 101.25853729248047, 109.48786926269531, 117.71720886230469, 125.94654083251953, 134.17587280273438, 142.40521240234375, 150.63455200195312, 158.86387634277344, 167.0932159423828, 175.3225555419922, 183.5518798828125, 191.78121948242188, 200.01055908203125, 208.23989868164062, 216.46922302246094, 224.6985626220703, 232.92788696289062, 241.1572265625, 249.3865509033203, 257.61590576171875, 265.84521484375, 274.0745544433594, 282.30389404296875, 290.5332336425781, 298.7625732421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 9.0, 8.0, 7.0, 7.0, 14.0, 10.0, 15.0, 15.0, 23.0, 27.0, 29.0, 23.0, 35.0, 28.0, 44.0, 40.0, 42.0, 35.0, 41.0, 50.0, 45.0, 42.0, 34.0, 43.0, 32.0, 38.0, 20.0, 26.0, 39.0, 23.0, 27.0, 24.0, 15.0, 12.0, 12.0, 9.0, 17.0, 8.0, 6.0, 7.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-113.14628601074219, -109.76753997802734, -106.3887939453125, -103.01004791259766, -99.63130187988281, -96.25255584716797, -92.87380981445312, -89.49507141113281, -86.11631774902344, -82.7375717163086, -79.35882568359375, -75.9800796508789, -72.60133361816406, -69.22258758544922, -65.84384155273438, -62.4650993347168, -59.08635711669922, -55.707611083984375, -52.32886505126953, -48.95011901855469, -45.571372985839844, -42.192626953125, -38.81388473510742, -35.43513870239258, -32.056392669677734, -28.67764663696289, -25.298900604248047, -21.920156478881836, -18.541410446166992, -15.162664413452148, -11.783920288085938, -8.405174255371094, -5.02642822265625, -1.6476826667785645, 1.731062889099121, 5.109807968139648, 8.488554000854492, 11.867300033569336, 15.246044158935547, 18.62479019165039, 22.003536224365234, 25.382282257080078, 28.761028289794922, 32.1397705078125, 35.518516540527344, 38.89726257324219, 42.27600860595703, 45.654754638671875, 49.03350067138672, 52.41224670410156, 55.790992736816406, 59.16973876953125, 62.548484802246094, 65.92723083496094, 69.30596923828125, 72.68472290039062, 76.06346130371094, 79.44220733642578, 82.82095336914062, 86.19969940185547, 89.57844543457031, 92.95719146728516, 96.3359375, 99.71467590332031, 103.09342956542969]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 0.0, 4.0, 1.0, 8.0, 8.0, 10.0, 7.0, 21.0, 26.0, 46.0, 68.0, 114.0, 132.0, 246.0, 402.0, 577.0, 1010.0, 1768.0, 3204.0, 6171.0, 13491.0, 31657.0, 85384.0, 290007.0, 418524.0, 119461.0, 42063.0, 17301.0, 7821.0, 3927.0, 2047.0, 1157.0, 688.0, 405.0, 266.0, 191.0, 102.0, 67.0, 51.0, 33.0, 29.0, 21.0, 9.0, 12.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.0, -84.20703125, -81.4140625, -78.62109375, -75.828125, -73.03515625, -70.2421875, -67.44921875, -64.65625, -61.86328125, -59.0703125, -56.27734375, -53.484375, -50.69140625, -47.8984375, -45.10546875, -42.3125, -39.51953125, -36.7265625, -33.93359375, -31.140625, -28.34765625, -25.5546875, -22.76171875, -19.96875, -17.17578125, -14.3828125, -11.58984375, -8.796875, -6.00390625, -3.2109375, -0.41796875, 2.375, 5.16796875, 7.9609375, 10.75390625, 13.546875, 16.33984375, 19.1328125, 21.92578125, 24.71875, 27.51171875, 30.3046875, 33.09765625, 35.890625, 38.68359375, 41.4765625, 44.26953125, 47.0625, 49.85546875, 52.6484375, 55.44140625, 58.234375, 61.02734375, 63.8203125, 66.61328125, 69.40625, 72.19921875, 74.9921875, 77.78515625, 80.578125, 83.37109375, 86.1640625, 88.95703125, 91.75]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 5.0, 7.0, 11.0, 19.0, 17.0, 21.0, 27.0, 38.0, 28.0, 46.0, 68.0, 70.0, 77.0, 70.0, 69.0, 67.0, 73.0, 64.0, 37.0, 42.0, 25.0, 22.0, 22.0, 15.0, 16.0, 16.0, 10.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.96875, -43.560546875, -42.15234375, -40.744140625, -39.3359375, -37.927734375, -36.51953125, -35.111328125, -33.703125, -32.294921875, -30.88671875, -29.478515625, -28.0703125, -26.662109375, -25.25390625, -23.845703125, -22.4375, -21.029296875, -19.62109375, -18.212890625, -16.8046875, -15.396484375, -13.98828125, -12.580078125, -11.171875, -9.763671875, -8.35546875, -6.947265625, -5.5390625, -4.130859375, -2.72265625, -1.314453125, 0.09375, 1.501953125, 2.91015625, 4.318359375, 5.7265625, 7.134765625, 8.54296875, 9.951171875, 11.359375, 12.767578125, 14.17578125, 15.583984375, 16.9921875, 18.400390625, 19.80859375, 21.216796875, 22.625, 24.033203125, 25.44140625, 26.849609375, 28.2578125, 29.666015625, 31.07421875, 32.482421875, 33.890625, 35.298828125, 36.70703125, 38.115234375, 39.5234375, 40.931640625, 42.33984375, 43.748046875, 45.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 12.0, 13.0, 10.0, 20.0, 18.0, 37.0, 45.0, 58.0, 104.0, 107.0, 167.0, 274.0, 381.0, 663.0, 1053.0, 1913.0, 3780.0, 8094.0, 21816.0, 72238.0, 386025.0, 432949.0, 78114.0, 23096.0, 8738.0, 3879.0, 1925.0, 1072.0, 600.0, 428.0, 285.0, 195.0, 115.0, 98.0, 60.0, 41.0, 30.0, 26.0, 18.0, 17.0, 5.0, 6.0, 7.0, 4.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0], "bins": [-102.6875, -99.755859375, -96.82421875, -93.892578125, -90.9609375, -88.029296875, -85.09765625, -82.166015625, -79.234375, -76.302734375, -73.37109375, -70.439453125, -67.5078125, -64.576171875, -61.64453125, -58.712890625, -55.78125, -52.849609375, -49.91796875, -46.986328125, -44.0546875, -41.123046875, -38.19140625, -35.259765625, -32.328125, -29.396484375, -26.46484375, -23.533203125, -20.6015625, -17.669921875, -14.73828125, -11.806640625, -8.875, -5.943359375, -3.01171875, -0.080078125, 2.8515625, 5.783203125, 8.71484375, 11.646484375, 14.578125, 17.509765625, 20.44140625, 23.373046875, 26.3046875, 29.236328125, 32.16796875, 35.099609375, 38.03125, 40.962890625, 43.89453125, 46.826171875, 49.7578125, 52.689453125, 55.62109375, 58.552734375, 61.484375, 64.416015625, 67.34765625, 70.279296875, 73.2109375, 76.142578125, 79.07421875, 82.005859375, 84.9375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 8.0, 12.0, 15.0, 17.0, 19.0, 22.0, 37.0, 41.0, 47.0, 38.0, 53.0, 50.0, 52.0, 57.0, 77.0, 66.0, 47.0, 46.0, 41.0, 50.0, 39.0, 27.0, 32.0, 23.0, 20.0, 15.0, 10.0, 8.0, 7.0, 9.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.125, -187.783203125, -182.44140625, -177.099609375, -171.7578125, -166.416015625, -161.07421875, -155.732421875, -150.390625, -145.048828125, -139.70703125, -134.365234375, -129.0234375, -123.681640625, -118.33984375, -112.998046875, -107.65625, -102.314453125, -96.97265625, -91.630859375, -86.2890625, -80.947265625, -75.60546875, -70.263671875, -64.921875, -59.580078125, -54.23828125, -48.896484375, -43.5546875, -38.212890625, -32.87109375, -27.529296875, -22.1875, -16.845703125, -11.50390625, -6.162109375, -0.8203125, 4.521484375, 9.86328125, 15.205078125, 20.546875, 25.888671875, 31.23046875, 36.572265625, 41.9140625, 47.255859375, 52.59765625, 57.939453125, 63.28125, 68.623046875, 73.96484375, 79.306640625, 84.6484375, 89.990234375, 95.33203125, 100.673828125, 106.015625, 111.357421875, 116.69921875, 122.041015625, 127.3828125, 132.724609375, 138.06640625, 143.408203125, 148.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 8.0, 5.0, 4.0, 7.0, 12.0, 19.0, 31.0, 49.0, 72.0, 157.0, 356.0, 1101.0, 4598.0, 47778.0, 954694.0, 34049.0, 3931.0, 984.0, 352.0, 158.0, 68.0, 38.0, 30.0, 18.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.5, -101.65625, -97.8125, -93.96875, -90.125, -86.28125, -82.4375, -78.59375, -74.75, -70.90625, -67.0625, -63.21875, -59.375, -55.53125, -51.6875, -47.84375, -44.0, -40.15625, -36.3125, -32.46875, -28.625, -24.78125, -20.9375, -17.09375, -13.25, -9.40625, -5.5625, -1.71875, 2.125, 5.96875, 9.8125, 13.65625, 17.5, 21.34375, 25.1875, 29.03125, 32.875, 36.71875, 40.5625, 44.40625, 48.25, 52.09375, 55.9375, 59.78125, 63.625, 67.46875, 71.3125, 75.15625, 79.0, 82.84375, 86.6875, 90.53125, 94.375, 98.21875, 102.0625, 105.90625, 109.75, 113.59375, 117.4375, 121.28125, 125.125, 128.96875, 132.8125, 136.65625, 140.5]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 25.0, 22.0, 23.0, 39.0, 53.0, 84.0, 144.0, 212.0, 159.0, 80.0, 46.0, 20.0, 19.0, 15.0, 12.0, 5.0, 9.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0136566162109375, -0.013141870498657227, -0.012627124786376953, -0.01211237907409668, -0.011597633361816406, -0.011082887649536133, -0.01056814193725586, -0.010053396224975586, -0.009538650512695312, -0.009023904800415039, -0.008509159088134766, -0.007994413375854492, -0.007479667663574219, -0.006964921951293945, -0.006450176239013672, -0.0059354305267333984, -0.005420684814453125, -0.0049059391021728516, -0.004391193389892578, -0.0038764476776123047, -0.0033617019653320312, -0.002846956253051758, -0.0023322105407714844, -0.001817464828491211, -0.0013027191162109375, -0.0007879734039306641, -0.0002732276916503906, 0.0002415180206298828, 0.0007562637329101562, 0.0012710094451904297, 0.0017857551574707031, 0.0023005008697509766, 0.00281524658203125, 0.0033299922943115234, 0.003844738006591797, 0.00435948371887207, 0.004874229431152344, 0.005388975143432617, 0.005903720855712891, 0.006418466567993164, 0.0069332122802734375, 0.007447957992553711, 0.007962703704833984, 0.008477449417114258, 0.008992195129394531, 0.009506940841674805, 0.010021686553955078, 0.010536432266235352, 0.011051177978515625, 0.011565923690795898, 0.012080669403076172, 0.012595415115356445, 0.013110160827636719, 0.013624906539916992, 0.014139652252197266, 0.014654397964477539, 0.015169143676757812, 0.015683889389038086, 0.01619863510131836, 0.016713380813598633, 0.017228126525878906, 0.01774287223815918, 0.018257617950439453, 0.018772363662719727, 0.019287109375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 8.0, 5.0, 4.0, 5.0, 17.0, 23.0, 25.0, 42.0, 60.0, 93.0, 161.0, 293.0, 466.0, 1076.0, 2846.0, 12254.0, 205873.0, 795902.0, 22184.0, 4280.0, 1433.0, 650.0, 323.0, 179.0, 103.0, 83.0, 43.0, 28.0, 25.0, 22.0, 14.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-104.0625, -100.611328125, -97.16015625, -93.708984375, -90.2578125, -86.806640625, -83.35546875, -79.904296875, -76.453125, -73.001953125, -69.55078125, -66.099609375, -62.6484375, -59.197265625, -55.74609375, -52.294921875, -48.84375, -45.392578125, -41.94140625, -38.490234375, -35.0390625, -31.587890625, -28.13671875, -24.685546875, -21.234375, -17.783203125, -14.33203125, -10.880859375, -7.4296875, -3.978515625, -0.52734375, 2.923828125, 6.375, 9.826171875, 13.27734375, 16.728515625, 20.1796875, 23.630859375, 27.08203125, 30.533203125, 33.984375, 37.435546875, 40.88671875, 44.337890625, 47.7890625, 51.240234375, 54.69140625, 58.142578125, 61.59375, 65.044921875, 68.49609375, 71.947265625, 75.3984375, 78.849609375, 82.30078125, 85.751953125, 89.203125, 92.654296875, 96.10546875, 99.556640625, 103.0078125, 106.458984375, 109.91015625, 113.361328125, 116.8125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 11.0, 11.0, 17.0, 24.0, 50.0, 90.0, 220.0, 257.0, 151.0, 67.0, 34.0, 19.0, 20.0, 13.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.375, -86.943359375, -83.51171875, -80.080078125, -76.6484375, -73.216796875, -69.78515625, -66.353515625, -62.921875, -59.490234375, -56.05859375, -52.626953125, -49.1953125, -45.763671875, -42.33203125, -38.900390625, -35.46875, -32.037109375, -28.60546875, -25.173828125, -21.7421875, -18.310546875, -14.87890625, -11.447265625, -8.015625, -4.583984375, -1.15234375, 2.279296875, 5.7109375, 9.142578125, 12.57421875, 16.005859375, 19.4375, 22.869140625, 26.30078125, 29.732421875, 33.1640625, 36.595703125, 40.02734375, 43.458984375, 46.890625, 50.322265625, 53.75390625, 57.185546875, 60.6171875, 64.048828125, 67.48046875, 70.912109375, 74.34375, 77.775390625, 81.20703125, 84.638671875, 88.0703125, 91.501953125, 94.93359375, 98.365234375, 101.796875, 105.228515625, 108.66015625, 112.091796875, 115.5234375, 118.955078125, 122.38671875, 125.818359375, 129.25]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 30.0, 157.0, 447.0, 263.0, 67.0, 22.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1050.192626953125, -941.7163696289062, -833.2401123046875, -724.7638549804688, -616.28759765625, -507.81134033203125, -399.3350830078125, -290.85882568359375, -182.382568359375, -73.90631103515625, 34.5699462890625, 143.04620361328125, 251.5224609375, 359.99871826171875, 468.4749755859375, 576.9512329101562, 685.427490234375, 793.9037475585938, 902.3800048828125, 1010.8562622070312, 1119.33251953125, 1227.808837890625, 1336.2850341796875, 1444.76123046875, 1553.237548828125, 1661.7138671875, 1770.1900634765625, 1878.666259765625, 1987.142578125, 2095.618896484375, 2204.09521484375, 2312.5712890625, 2421.04736328125, 2529.523681640625, 2638.0, 2746.47607421875, 2854.952392578125, 2963.4287109375, 3071.90478515625, 3180.381103515625, 3288.857421875, 3397.333740234375, 3505.81005859375, 3614.2861328125, 3722.762451171875, 3831.23876953125, 3939.71484375, 4048.191162109375, 4156.66748046875, 4265.1435546875, 4373.6201171875, 4482.09619140625, 4590.572265625, 4699.048828125, 4807.52490234375, 4916.00146484375, 5024.4775390625, 5132.95361328125, 5241.43017578125, 5349.90625, 5458.3828125, 5566.85888671875, 5675.3349609375, 5783.8115234375, 5892.28759765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 9.0, 3.0, 8.0, 8.0, 14.0, 9.0, 11.0, 13.0, 22.0, 26.0, 24.0, 36.0, 27.0, 32.0, 37.0, 39.0, 40.0, 54.0, 43.0, 53.0, 55.0, 37.0, 55.0, 40.0, 46.0, 37.0, 42.0, 30.0, 30.0, 17.0, 26.0, 17.0, 16.0, 10.0, 12.0, 11.0, 5.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-621.1695556640625, -600.2647705078125, -579.3599853515625, -558.4552001953125, -537.5504150390625, -516.6456298828125, -495.7408447265625, -474.8360595703125, -453.9312744140625, -433.0264892578125, -412.1217041015625, -391.2169189453125, -370.3121337890625, -349.4073486328125, -328.5025634765625, -307.5977783203125, -286.6929626464844, -265.7881774902344, -244.88339233398438, -223.97860717773438, -203.07382202148438, -182.16903686523438, -161.2642364501953, -140.3594512939453, -119.45466613769531, -98.54988098144531, -77.64509582519531, -56.74030303955078, -35.83551788330078, -14.930732727050781, 5.97406005859375, 26.87884521484375, 47.78363037109375, 68.68841552734375, 89.59320068359375, 110.49799346923828, 131.40277099609375, 152.30755615234375, 173.2123565673828, 194.1171417236328, 215.0219268798828, 235.9267120361328, 256.8315124511719, 277.7362976074219, 298.6410827636719, 319.5458679199219, 340.4506530761719, 361.3554382324219, 382.2602233886719, 403.1650085449219, 424.0697937011719, 444.9745788574219, 465.8793640136719, 486.7841491699219, 507.68896484375, 528.59375, 549.49853515625, 570.4033203125, 591.30810546875, 612.212890625, 633.11767578125, 654.0224609375, 674.92724609375, 695.83203125, 716.73681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 15.0, 13.0, 20.0, 27.0, 46.0, 64.0, 72.0, 125.0, 127.0, 188.0, 252.0, 357.0, 524.0, 766.0, 1063.0, 1690.0, 2684.0, 4578.0, 8676.0, 19378.0, 65604.0, 903120.0, 2988755.0, 141421.0, 28522.0, 11413.0, 5606.0, 3251.0, 1884.0, 1180.0, 837.0, 533.0, 412.0, 267.0, 195.0, 158.0, 105.0, 96.0, 60.0, 57.0, 45.0, 25.0, 15.0, 12.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.9375, -68.5068359375, -66.076171875, -63.6455078125, -61.21484375, -58.7841796875, -56.353515625, -53.9228515625, -51.4921875, -49.0615234375, -46.630859375, -44.2001953125, -41.76953125, -39.3388671875, -36.908203125, -34.4775390625, -32.046875, -29.6162109375, -27.185546875, -24.7548828125, -22.32421875, -19.8935546875, -17.462890625, -15.0322265625, -12.6015625, -10.1708984375, -7.740234375, -5.3095703125, -2.87890625, -0.4482421875, 1.982421875, 4.4130859375, 6.84375, 9.2744140625, 11.705078125, 14.1357421875, 16.56640625, 18.9970703125, 21.427734375, 23.8583984375, 26.2890625, 28.7197265625, 31.150390625, 33.5810546875, 36.01171875, 38.4423828125, 40.873046875, 43.3037109375, 45.734375, 48.1650390625, 50.595703125, 53.0263671875, 55.45703125, 57.8876953125, 60.318359375, 62.7490234375, 65.1796875, 67.6103515625, 70.041015625, 72.4716796875, 74.90234375, 77.3330078125, 79.763671875, 82.1943359375, 84.625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 7.0, 14.0, 28.0, 17.0, 25.0, 40.0, 39.0, 45.0, 61.0, 68.0, 77.0, 75.0, 76.0, 78.0, 68.0, 63.0, 44.0, 36.0, 32.0, 25.0, 12.0, 13.0, 12.0, 11.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.03125, -33.60693359375, -32.1826171875, -30.75830078125, -29.333984375, -27.90966796875, -26.4853515625, -25.06103515625, -23.63671875, -22.21240234375, -20.7880859375, -19.36376953125, -17.939453125, -16.51513671875, -15.0908203125, -13.66650390625, -12.2421875, -10.81787109375, -9.3935546875, -7.96923828125, -6.544921875, -5.12060546875, -3.6962890625, -2.27197265625, -0.84765625, 0.57666015625, 2.0009765625, 3.42529296875, 4.849609375, 6.27392578125, 7.6982421875, 9.12255859375, 10.546875, 11.97119140625, 13.3955078125, 14.81982421875, 16.244140625, 17.66845703125, 19.0927734375, 20.51708984375, 21.94140625, 23.36572265625, 24.7900390625, 26.21435546875, 27.638671875, 29.06298828125, 30.4873046875, 31.91162109375, 33.3359375, 34.76025390625, 36.1845703125, 37.60888671875, 39.033203125, 40.45751953125, 41.8818359375, 43.30615234375, 44.73046875, 46.15478515625, 47.5791015625, 49.00341796875, 50.427734375, 51.85205078125, 53.2763671875, 54.70068359375, 56.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 11.0, 6.0, 8.0, 13.0, 20.0, 16.0, 41.0, 73.0, 88.0, 162.0, 246.0, 428.0, 781.0, 1588.0, 3545.0, 8788.0, 25957.0, 110839.0, 3336524.0, 621263.0, 56466.0, 16364.0, 5971.0, 2408.0, 1174.0, 613.0, 348.0, 210.0, 111.0, 79.0, 38.0, 37.0, 16.0, 16.0, 9.0, 7.0, 3.0, 4.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.875, -98.337890625, -94.80078125, -91.263671875, -87.7265625, -84.189453125, -80.65234375, -77.115234375, -73.578125, -70.041015625, -66.50390625, -62.966796875, -59.4296875, -55.892578125, -52.35546875, -48.818359375, -45.28125, -41.744140625, -38.20703125, -34.669921875, -31.1328125, -27.595703125, -24.05859375, -20.521484375, -16.984375, -13.447265625, -9.91015625, -6.373046875, -2.8359375, 0.701171875, 4.23828125, 7.775390625, 11.3125, 14.849609375, 18.38671875, 21.923828125, 25.4609375, 28.998046875, 32.53515625, 36.072265625, 39.609375, 43.146484375, 46.68359375, 50.220703125, 53.7578125, 57.294921875, 60.83203125, 64.369140625, 67.90625, 71.443359375, 74.98046875, 78.517578125, 82.0546875, 85.591796875, 89.12890625, 92.666015625, 96.203125, 99.740234375, 103.27734375, 106.814453125, 110.3515625, 113.888671875, 117.42578125, 120.962890625, 124.5]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 12.0, 13.0, 11.0, 24.0, 24.0, 36.0, 37.0, 63.0, 102.0, 205.0, 526.0, 1404.0, 898.0, 321.0, 132.0, 76.0, 41.0, 30.0, 17.0, 23.0, 17.0, 10.0, 11.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.625, -136.6904296875, -132.755859375, -128.8212890625, -124.88671875, -120.9521484375, -117.017578125, -113.0830078125, -109.1484375, -105.2138671875, -101.279296875, -97.3447265625, -93.41015625, -89.4755859375, -85.541015625, -81.6064453125, -77.671875, -73.7373046875, -69.802734375, -65.8681640625, -61.93359375, -57.9990234375, -54.064453125, -50.1298828125, -46.1953125, -42.2607421875, -38.326171875, -34.3916015625, -30.45703125, -26.5224609375, -22.587890625, -18.6533203125, -14.71875, -10.7841796875, -6.849609375, -2.9150390625, 1.01953125, 4.9541015625, 8.888671875, 12.8232421875, 16.7578125, 20.6923828125, 24.626953125, 28.5615234375, 32.49609375, 36.4306640625, 40.365234375, 44.2998046875, 48.234375, 52.1689453125, 56.103515625, 60.0380859375, 63.97265625, 67.9072265625, 71.841796875, 75.7763671875, 79.7109375, 83.6455078125, 87.580078125, 91.5146484375, 95.44921875, 99.3837890625, 103.318359375, 107.2529296875, 111.1875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 20.0, 25.0, 51.0, 106.0, 196.0, 292.0, 181.0, 62.0, 26.0, 14.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1828.8466796875, -1782.648193359375, -1736.44970703125, -1690.251220703125, -1644.052734375, -1597.854248046875, -1551.65576171875, -1505.457275390625, -1459.2587890625, -1413.060302734375, -1366.86181640625, -1320.663330078125, -1274.46484375, -1228.266357421875, -1182.06787109375, -1135.869384765625, -1089.6710205078125, -1043.4725341796875, -997.2740478515625, -951.0755615234375, -904.8770751953125, -858.6785888671875, -812.4801635742188, -766.2816772460938, -720.0831909179688, -673.8847045898438, -627.6862182617188, -581.48779296875, -535.289306640625, -489.0907897949219, -442.892333984375, -396.69384765625, -350.495361328125, -304.296875, -258.098388671875, -211.89993286132812, -165.70144653320312, -119.50296020507812, -73.30450439453125, -27.10601806640625, 19.09246826171875, 65.29094696044922, 111.48942565917969, 157.68789672851562, 203.88638305664062, 250.08486938476562, 296.2833251953125, 342.4818115234375, 388.6802978515625, 434.8787841796875, 481.0772705078125, 527.2757568359375, 573.4742431640625, 619.6727294921875, 665.8711547851562, 712.0696411132812, 758.2681274414062, 804.4666137695312, 850.6651000976562, 896.863525390625, 943.06201171875, 989.260498046875, 1035.458984375, 1081.657470703125, 1127.85595703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 7.0, 6.0, 17.0, 23.0, 20.0, 16.0, 19.0, 25.0, 28.0, 32.0, 31.0, 31.0, 40.0, 42.0, 42.0, 39.0, 37.0, 46.0, 50.0, 33.0, 42.0, 44.0, 44.0, 43.0, 25.0, 29.0, 35.0, 22.0, 23.0, 10.0, 13.0, 9.0, 13.0, 8.0, 11.0, 10.0, 7.0, 5.0, 2.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-447.6067810058594, -433.94354248046875, -420.28033447265625, -406.61712646484375, -392.9538879394531, -379.2906494140625, -365.62744140625, -351.9642333984375, -338.3009948730469, -324.63775634765625, -310.97454833984375, -297.31134033203125, -283.6481018066406, -269.98486328125, -256.3216552734375, -242.65843200683594, -228.99520874023438, -215.3319854736328, -201.66876220703125, -188.0055389404297, -174.34231567382812, -160.67909240722656, -147.015869140625, -133.35264587402344, -119.68942260742188, -106.02619934082031, -92.36297607421875, -78.69975280761719, -65.03652954101562, -51.37330627441406, -37.7100830078125, -24.046859741210938, -10.38360595703125, 3.2796173095703125, 16.942840576171875, 30.606063842773438, 44.269287109375, 57.93251037597656, 71.59573364257812, 85.25895690917969, 98.92218017578125, 112.58540344238281, 126.24862670898438, 139.91184997558594, 153.5750732421875, 167.23829650878906, 180.90151977539062, 194.5647430419922, 208.22796630859375, 221.8911895751953, 235.55441284179688, 249.21763610839844, 262.880859375, 276.5440673828125, 290.2073059082031, 303.87054443359375, 317.53375244140625, 331.19696044921875, 344.8601989746094, 358.5234375, 372.1866455078125, 385.849853515625, 399.5130920410156, 413.17633056640625, 426.83953857421875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 10.0, 10.0, 17.0, 14.0, 30.0, 47.0, 67.0, 89.0, 143.0, 223.0, 329.0, 457.0, 697.0, 978.0, 1595.0, 2476.0, 4149.0, 6958.0, 12624.0, 24743.0, 53562.0, 140373.0, 394937.0, 243737.0, 83951.0, 35681.0, 17201.0, 9233.0, 5166.0, 3165.0, 2007.0, 1241.0, 863.0, 518.0, 368.0, 261.0, 187.0, 129.0, 102.0, 62.0, 40.0, 33.0, 22.0, 19.0, 13.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-71.875, -69.7451171875, -67.615234375, -65.4853515625, -63.35546875, -61.2255859375, -59.095703125, -56.9658203125, -54.8359375, -52.7060546875, -50.576171875, -48.4462890625, -46.31640625, -44.1865234375, -42.056640625, -39.9267578125, -37.796875, -35.6669921875, -33.537109375, -31.4072265625, -29.27734375, -27.1474609375, -25.017578125, -22.8876953125, -20.7578125, -18.6279296875, -16.498046875, -14.3681640625, -12.23828125, -10.1083984375, -7.978515625, -5.8486328125, -3.71875, -1.5888671875, 0.541015625, 2.6708984375, 4.80078125, 6.9306640625, 9.060546875, 11.1904296875, 13.3203125, 15.4501953125, 17.580078125, 19.7099609375, 21.83984375, 23.9697265625, 26.099609375, 28.2294921875, 30.359375, 32.4892578125, 34.619140625, 36.7490234375, 38.87890625, 41.0087890625, 43.138671875, 45.2685546875, 47.3984375, 49.5283203125, 51.658203125, 53.7880859375, 55.91796875, 58.0478515625, 60.177734375, 62.3076171875, 64.4375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 10.0, 15.0, 19.0, 22.0, 23.0, 28.0, 32.0, 46.0, 49.0, 45.0, 60.0, 69.0, 58.0, 64.0, 72.0, 49.0, 54.0, 50.0, 37.0, 33.0, 35.0, 20.0, 21.0, 19.0, 19.0, 11.0, 6.0, 1.0, 4.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.630859375, -30.35546875, -29.080078125, -27.8046875, -26.529296875, -25.25390625, -23.978515625, -22.703125, -21.427734375, -20.15234375, -18.876953125, -17.6015625, -16.326171875, -15.05078125, -13.775390625, -12.5, -11.224609375, -9.94921875, -8.673828125, -7.3984375, -6.123046875, -4.84765625, -3.572265625, -2.296875, -1.021484375, 0.25390625, 1.529296875, 2.8046875, 4.080078125, 5.35546875, 6.630859375, 7.90625, 9.181640625, 10.45703125, 11.732421875, 13.0078125, 14.283203125, 15.55859375, 16.833984375, 18.109375, 19.384765625, 20.66015625, 21.935546875, 23.2109375, 24.486328125, 25.76171875, 27.037109375, 28.3125, 29.587890625, 30.86328125, 32.138671875, 33.4140625, 34.689453125, 35.96484375, 37.240234375, 38.515625, 39.791015625, 41.06640625, 42.341796875, 43.6171875, 44.892578125, 46.16796875, 47.443359375, 48.71875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 11.0, 18.0, 18.0, 29.0, 35.0, 51.0, 67.0, 108.0, 202.0, 293.0, 433.0, 809.0, 1624.0, 3957.0, 12396.0, 60986.0, 732676.0, 197690.0, 25240.0, 6758.0, 2447.0, 1122.0, 594.0, 314.0, 219.0, 121.0, 97.0, 67.0, 46.0, 28.0, 25.0, 15.0, 12.0, 7.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-161.625, -156.689453125, -151.75390625, -146.818359375, -141.8828125, -136.947265625, -132.01171875, -127.076171875, -122.140625, -117.205078125, -112.26953125, -107.333984375, -102.3984375, -97.462890625, -92.52734375, -87.591796875, -82.65625, -77.720703125, -72.78515625, -67.849609375, -62.9140625, -57.978515625, -53.04296875, -48.107421875, -43.171875, -38.236328125, -33.30078125, -28.365234375, -23.4296875, -18.494140625, -13.55859375, -8.623046875, -3.6875, 1.248046875, 6.18359375, 11.119140625, 16.0546875, 20.990234375, 25.92578125, 30.861328125, 35.796875, 40.732421875, 45.66796875, 50.603515625, 55.5390625, 60.474609375, 65.41015625, 70.345703125, 75.28125, 80.216796875, 85.15234375, 90.087890625, 95.0234375, 99.958984375, 104.89453125, 109.830078125, 114.765625, 119.701171875, 124.63671875, 129.572265625, 134.5078125, 139.443359375, 144.37890625, 149.314453125, 154.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 9.0, 6.0, 9.0, 13.0, 16.0, 23.0, 26.0, 32.0, 31.0, 34.0, 45.0, 42.0, 35.0, 34.0, 55.0, 50.0, 49.0, 42.0, 54.0, 52.0, 47.0, 42.0, 32.0, 35.0, 36.0, 21.0, 21.0, 19.0, 9.0, 9.0, 8.0, 9.0, 8.0, 4.0, 6.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-184.875, -180.048828125, -175.22265625, -170.396484375, -165.5703125, -160.744140625, -155.91796875, -151.091796875, -146.265625, -141.439453125, -136.61328125, -131.787109375, -126.9609375, -122.134765625, -117.30859375, -112.482421875, -107.65625, -102.830078125, -98.00390625, -93.177734375, -88.3515625, -83.525390625, -78.69921875, -73.873046875, -69.046875, -64.220703125, -59.39453125, -54.568359375, -49.7421875, -44.916015625, -40.08984375, -35.263671875, -30.4375, -25.611328125, -20.78515625, -15.958984375, -11.1328125, -6.306640625, -1.48046875, 3.345703125, 8.171875, 12.998046875, 17.82421875, 22.650390625, 27.4765625, 32.302734375, 37.12890625, 41.955078125, 46.78125, 51.607421875, 56.43359375, 61.259765625, 66.0859375, 70.912109375, 75.73828125, 80.564453125, 85.390625, 90.216796875, 95.04296875, 99.869140625, 104.6953125, 109.521484375, 114.34765625, 119.173828125, 124.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 7.0, 7.0, 11.0, 17.0, 13.0, 32.0, 41.0, 65.0, 119.0, 186.0, 320.0, 610.0, 1194.0, 2696.0, 6509.0, 21063.0, 134098.0, 761233.0, 93140.0, 16884.0, 5457.0, 2407.0, 1097.0, 512.0, 289.0, 207.0, 124.0, 71.0, 43.0, 33.0, 17.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.375, -42.7568359375, -41.138671875, -39.5205078125, -37.90234375, -36.2841796875, -34.666015625, -33.0478515625, -31.4296875, -29.8115234375, -28.193359375, -26.5751953125, -24.95703125, -23.3388671875, -21.720703125, -20.1025390625, -18.484375, -16.8662109375, -15.248046875, -13.6298828125, -12.01171875, -10.3935546875, -8.775390625, -7.1572265625, -5.5390625, -3.9208984375, -2.302734375, -0.6845703125, 0.93359375, 2.5517578125, 4.169921875, 5.7880859375, 7.40625, 9.0244140625, 10.642578125, 12.2607421875, 13.87890625, 15.4970703125, 17.115234375, 18.7333984375, 20.3515625, 21.9697265625, 23.587890625, 25.2060546875, 26.82421875, 28.4423828125, 30.060546875, 31.6787109375, 33.296875, 34.9150390625, 36.533203125, 38.1513671875, 39.76953125, 41.3876953125, 43.005859375, 44.6240234375, 46.2421875, 47.8603515625, 49.478515625, 51.0966796875, 52.71484375, 54.3330078125, 55.951171875, 57.5693359375, 59.1875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 7.0, 16.0, 18.0, 34.0, 37.0, 61.0, 100.0, 120.0, 187.0, 144.0, 89.0, 51.0, 45.0, 16.0, 11.0, 10.0, 11.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018157958984375, -0.017614126205444336, -0.017070293426513672, -0.016526460647583008, -0.015982627868652344, -0.01543879508972168, -0.014894962310791016, -0.014351129531860352, -0.013807296752929688, -0.013263463973999023, -0.01271963119506836, -0.012175798416137695, -0.011631965637207031, -0.011088132858276367, -0.010544300079345703, -0.010000467300415039, -0.009456634521484375, -0.008912801742553711, -0.008368968963623047, -0.007825136184692383, -0.007281303405761719, -0.006737470626831055, -0.006193637847900391, -0.0056498050689697266, -0.0051059722900390625, -0.0045621395111083984, -0.004018306732177734, -0.0034744739532470703, -0.0029306411743164062, -0.002386808395385742, -0.0018429756164550781, -0.001299142837524414, -0.00075531005859375, -0.00021147727966308594, 0.0003323554992675781, 0.0008761882781982422, 0.0014200210571289062, 0.0019638538360595703, 0.0025076866149902344, 0.0030515193939208984, 0.0035953521728515625, 0.0041391849517822266, 0.004683017730712891, 0.005226850509643555, 0.005770683288574219, 0.006314516067504883, 0.006858348846435547, 0.007402181625366211, 0.007946014404296875, 0.008489847183227539, 0.009033679962158203, 0.009577512741088867, 0.010121345520019531, 0.010665178298950195, 0.01120901107788086, 0.011752843856811523, 0.012296676635742188, 0.012840509414672852, 0.013384342193603516, 0.01392817497253418, 0.014472007751464844, 0.015015840530395508, 0.015559673309326172, 0.016103506088256836, 0.0166473388671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 10.0, 12.0, 14.0, 20.0, 29.0, 42.0, 56.0, 81.0, 126.0, 201.0, 353.0, 647.0, 1119.0, 2386.0, 6094.0, 19918.0, 113039.0, 726313.0, 143128.0, 22680.0, 6694.0, 2646.0, 1288.0, 631.0, 363.0, 221.0, 137.0, 95.0, 59.0, 38.0, 29.0, 22.0, 11.0, 18.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0, -43.57373046875, -42.1474609375, -40.72119140625, -39.294921875, -37.86865234375, -36.4423828125, -35.01611328125, -33.58984375, -32.16357421875, -30.7373046875, -29.31103515625, -27.884765625, -26.45849609375, -25.0322265625, -23.60595703125, -22.1796875, -20.75341796875, -19.3271484375, -17.90087890625, -16.474609375, -15.04833984375, -13.6220703125, -12.19580078125, -10.76953125, -9.34326171875, -7.9169921875, -6.49072265625, -5.064453125, -3.63818359375, -2.2119140625, -0.78564453125, 0.640625, 2.06689453125, 3.4931640625, 4.91943359375, 6.345703125, 7.77197265625, 9.1982421875, 10.62451171875, 12.05078125, 13.47705078125, 14.9033203125, 16.32958984375, 17.755859375, 19.18212890625, 20.6083984375, 22.03466796875, 23.4609375, 24.88720703125, 26.3134765625, 27.73974609375, 29.166015625, 30.59228515625, 32.0185546875, 33.44482421875, 34.87109375, 36.29736328125, 37.7236328125, 39.14990234375, 40.576171875, 42.00244140625, 43.4287109375, 44.85498046875, 46.28125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 10.0, 6.0, 12.0, 16.0, 12.0, 15.0, 23.0, 47.0, 50.0, 60.0, 75.0, 82.0, 77.0, 91.0, 74.0, 80.0, 56.0, 55.0, 41.0, 25.0, 15.0, 13.0, 10.0, 10.0, 12.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-48.1875, -46.85107421875, -45.5146484375, -44.17822265625, -42.841796875, -41.50537109375, -40.1689453125, -38.83251953125, -37.49609375, -36.15966796875, -34.8232421875, -33.48681640625, -32.150390625, -30.81396484375, -29.4775390625, -28.14111328125, -26.8046875, -25.46826171875, -24.1318359375, -22.79541015625, -21.458984375, -20.12255859375, -18.7861328125, -17.44970703125, -16.11328125, -14.77685546875, -13.4404296875, -12.10400390625, -10.767578125, -9.43115234375, -8.0947265625, -6.75830078125, -5.421875, -4.08544921875, -2.7490234375, -1.41259765625, -0.076171875, 1.26025390625, 2.5966796875, 3.93310546875, 5.26953125, 6.60595703125, 7.9423828125, 9.27880859375, 10.615234375, 11.95166015625, 13.2880859375, 14.62451171875, 15.9609375, 17.29736328125, 18.6337890625, 19.97021484375, 21.306640625, 22.64306640625, 23.9794921875, 25.31591796875, 26.65234375, 27.98876953125, 29.3251953125, 30.66162109375, 31.998046875, 33.33447265625, 34.6708984375, 36.00732421875, 37.34375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 12.0, 8.0, 9.0, 28.0, 52.0, 59.0, 93.0, 138.0, 155.0, 150.0, 87.0, 72.0, 51.0, 28.0, 20.0, 16.0, 7.0, 2.0, 1.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-859.085205078125, -830.8626708984375, -802.6400756835938, -774.4175415039062, -746.1949462890625, -717.972412109375, -689.7498779296875, -661.52734375, -633.3047485351562, -605.0822143554688, -576.859619140625, -548.6370849609375, -520.41455078125, -492.19195556640625, -463.96942138671875, -435.7468566894531, -407.5242919921875, -379.3017272949219, -351.07916259765625, -322.85662841796875, -294.6340637207031, -266.4114990234375, -238.18894958496094, -209.96640014648438, -181.74383544921875, -153.52127075195312, -125.29872131347656, -97.07616424560547, -68.85360717773438, -40.63104248046875, -12.408493041992188, 15.814056396484375, 44.03662109375, 72.2591781616211, 100.48173522949219, 128.70428466796875, 156.92684936523438, 185.1494140625, 213.37196350097656, 241.59451293945312, 269.81707763671875, 298.0396423339844, 326.26220703125, 354.4847412109375, 382.7073059082031, 410.92987060546875, 439.15240478515625, 467.3749694824219, 495.5975341796875, 523.820068359375, 552.0426635742188, 580.2651977539062, 608.48779296875, 636.7103271484375, 664.932861328125, 693.1553955078125, 721.3779907226562, 749.6005249023438, 777.8231201171875, 806.045654296875, 834.2681884765625, 862.4907836914062, 890.7133178710938, 918.9359130859375, 947.158447265625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 12.0, 14.0, 13.0, 21.0, 24.0, 23.0, 20.0, 23.0, 29.0, 29.0, 41.0, 47.0, 66.0, 55.0, 65.0, 48.0, 56.0, 49.0, 35.0, 35.0, 31.0, 31.0, 35.0, 32.0, 29.0, 19.0, 14.0, 18.0, 9.0, 8.0, 10.0, 14.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-621.265380859375, -602.0185546875, -582.7717895507812, -563.5249633789062, -544.2781372070312, -525.0313110351562, -505.7845458984375, -486.5377197265625, -467.2908935546875, -448.0440979003906, -428.7972717285156, -409.55047607421875, -390.30364990234375, -371.0568542480469, -351.81005859375, -332.563232421875, -313.3164367675781, -294.06964111328125, -274.82281494140625, -255.57601928710938, -236.32919311523438, -217.0823974609375, -197.83558654785156, -178.58877563476562, -159.3419647216797, -140.09515380859375, -120.84834289550781, -101.6015396118164, -82.35472869873047, -63.10791778564453, -43.861114501953125, -24.614303588867188, -5.36749267578125, 13.879316329956055, 33.12612533569336, 52.37293243408203, 71.61974334716797, 90.8665542602539, 110.11335754394531, 129.36016845703125, 148.6069793701172, 167.85379028320312, 187.10060119628906, 206.347412109375, 225.59420776367188, 244.84103393554688, 264.08782958984375, 283.33465576171875, 302.5814514160156, 321.8282470703125, 341.0750732421875, 360.3218688964844, 379.5686950683594, 398.81549072265625, 418.06231689453125, 437.3091125488281, 456.555908203125, 475.8027038574219, 495.0495300292969, 514.2963256835938, 533.5431518554688, 552.7899780273438, 572.0367431640625, 591.2835693359375, 610.5303955078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 16.0, 12.0, 16.0, 27.0, 31.0, 35.0, 61.0, 127.0, 247.0, 494.0, 1273.0, 3488.0, 13045.0, 183165.0, 3873333.0, 102921.0, 10835.0, 3048.0, 1105.0, 462.0, 213.0, 104.0, 59.0, 21.0, 37.0, 18.0, 11.0, 9.0, 11.0, 4.0, 8.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-122.125, -118.2392578125, -114.353515625, -110.4677734375, -106.58203125, -102.6962890625, -98.810546875, -94.9248046875, -91.0390625, -87.1533203125, -83.267578125, -79.3818359375, -75.49609375, -71.6103515625, -67.724609375, -63.8388671875, -59.953125, -56.0673828125, -52.181640625, -48.2958984375, -44.41015625, -40.5244140625, -36.638671875, -32.7529296875, -28.8671875, -24.9814453125, -21.095703125, -17.2099609375, -13.32421875, -9.4384765625, -5.552734375, -1.6669921875, 2.21875, 6.1044921875, 9.990234375, 13.8759765625, 17.76171875, 21.6474609375, 25.533203125, 29.4189453125, 33.3046875, 37.1904296875, 41.076171875, 44.9619140625, 48.84765625, 52.7333984375, 56.619140625, 60.5048828125, 64.390625, 68.2763671875, 72.162109375, 76.0478515625, 79.93359375, 83.8193359375, 87.705078125, 91.5908203125, 95.4765625, 99.3623046875, 103.248046875, 107.1337890625, 111.01953125, 114.9052734375, 118.791015625, 122.6767578125, 126.5625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 2.0, 6.0, 13.0, 8.0, 9.0, 9.0, 19.0, 15.0, 21.0, 16.0, 29.0, 40.0, 37.0, 40.0, 55.0, 47.0, 44.0, 73.0, 69.0, 63.0, 42.0, 56.0, 55.0, 45.0, 27.0, 25.0, 24.0, 12.0, 18.0, 20.0, 15.0, 10.0, 10.0, 4.0, 12.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.15625, -36.99853515625, -35.8408203125, -34.68310546875, -33.525390625, -32.36767578125, -31.2099609375, -30.05224609375, -28.89453125, -27.73681640625, -26.5791015625, -25.42138671875, -24.263671875, -23.10595703125, -21.9482421875, -20.79052734375, -19.6328125, -18.47509765625, -17.3173828125, -16.15966796875, -15.001953125, -13.84423828125, -12.6865234375, -11.52880859375, -10.37109375, -9.21337890625, -8.0556640625, -6.89794921875, -5.740234375, -4.58251953125, -3.4248046875, -2.26708984375, -1.109375, 0.04833984375, 1.2060546875, 2.36376953125, 3.521484375, 4.67919921875, 5.8369140625, 6.99462890625, 8.15234375, 9.31005859375, 10.4677734375, 11.62548828125, 12.783203125, 13.94091796875, 15.0986328125, 16.25634765625, 17.4140625, 18.57177734375, 19.7294921875, 20.88720703125, 22.044921875, 23.20263671875, 24.3603515625, 25.51806640625, 26.67578125, 27.83349609375, 28.9912109375, 30.14892578125, 31.306640625, 32.46435546875, 33.6220703125, 34.77978515625, 35.9375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 13.0, 6.0, 15.0, 27.0, 30.0, 49.0, 86.0, 122.0, 233.0, 298.0, 488.0, 780.0, 1290.0, 2312.0, 4807.0, 11148.0, 31970.0, 148658.0, 2966738.0, 910060.0, 77751.0, 21124.0, 7936.0, 3680.0, 1825.0, 1062.0, 615.0, 399.0, 237.0, 162.0, 118.0, 64.0, 54.0, 38.0, 30.0, 13.0, 11.0, 9.0, 2.0, 8.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.75, -80.1494140625, -77.548828125, -74.9482421875, -72.34765625, -69.7470703125, -67.146484375, -64.5458984375, -61.9453125, -59.3447265625, -56.744140625, -54.1435546875, -51.54296875, -48.9423828125, -46.341796875, -43.7412109375, -41.140625, -38.5400390625, -35.939453125, -33.3388671875, -30.73828125, -28.1376953125, -25.537109375, -22.9365234375, -20.3359375, -17.7353515625, -15.134765625, -12.5341796875, -9.93359375, -7.3330078125, -4.732421875, -2.1318359375, 0.46875, 3.0693359375, 5.669921875, 8.2705078125, 10.87109375, 13.4716796875, 16.072265625, 18.6728515625, 21.2734375, 23.8740234375, 26.474609375, 29.0751953125, 31.67578125, 34.2763671875, 36.876953125, 39.4775390625, 42.078125, 44.6787109375, 47.279296875, 49.8798828125, 52.48046875, 55.0810546875, 57.681640625, 60.2822265625, 62.8828125, 65.4833984375, 68.083984375, 70.6845703125, 73.28515625, 75.8857421875, 78.486328125, 81.0869140625, 83.6875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 4.0, 11.0, 21.0, 22.0, 23.0, 59.0, 82.0, 155.0, 335.0, 823.0, 1243.0, 640.0, 276.0, 137.0, 81.0, 44.0, 24.0, 26.0, 17.0, 5.0, 8.0, 5.0, 5.0, 4.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.6875, -102.2119140625, -98.736328125, -95.2607421875, -91.78515625, -88.3095703125, -84.833984375, -81.3583984375, -77.8828125, -74.4072265625, -70.931640625, -67.4560546875, -63.98046875, -60.5048828125, -57.029296875, -53.5537109375, -50.078125, -46.6025390625, -43.126953125, -39.6513671875, -36.17578125, -32.7001953125, -29.224609375, -25.7490234375, -22.2734375, -18.7978515625, -15.322265625, -11.8466796875, -8.37109375, -4.8955078125, -1.419921875, 2.0556640625, 5.53125, 9.0068359375, 12.482421875, 15.9580078125, 19.43359375, 22.9091796875, 26.384765625, 29.8603515625, 33.3359375, 36.8115234375, 40.287109375, 43.7626953125, 47.23828125, 50.7138671875, 54.189453125, 57.6650390625, 61.140625, 64.6162109375, 68.091796875, 71.5673828125, 75.04296875, 78.5185546875, 81.994140625, 85.4697265625, 88.9453125, 92.4208984375, 95.896484375, 99.3720703125, 102.84765625, 106.3232421875, 109.798828125, 113.2744140625, 116.75]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 7.0, 12.0, 19.0, 10.0, 50.0, 68.0, 102.0, 115.0, 147.0, 147.0, 109.0, 66.0, 49.0, 31.0, 20.0, 9.0, 10.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-392.81005859375, -373.8019104003906, -354.7937316894531, -335.78558349609375, -316.77740478515625, -297.7692565917969, -278.7611083984375, -259.7529296875, -240.74478149414062, -221.7366180419922, -202.72845458984375, -183.72030639648438, -164.71214294433594, -145.7039794921875, -126.6958236694336, -107.68766784667969, -88.67950439453125, -69.67134094238281, -50.663185119628906, -31.655025482177734, -12.646865844726562, 6.361297607421875, 25.36945343017578, 44.37760925292969, 63.385772705078125, 82.39393615722656, 101.40209197998047, 120.41024780273438, 139.4184112548828, 158.42657470703125, 177.43472290039062, 196.44288635253906, 215.45111083984375, 234.4592742919922, 253.46743774414062, 272.4755859375, 291.4837646484375, 310.4919128417969, 329.50006103515625, 348.50823974609375, 367.5163879394531, 386.5245361328125, 405.53271484375, 424.5408630371094, 443.54901123046875, 462.55718994140625, 481.5653381347656, 500.573486328125, 519.5816650390625, 538.58984375, 557.5979614257812, 576.6061401367188, 595.6143188476562, 614.6224365234375, 633.630615234375, 652.6387939453125, 671.64697265625, 690.6551513671875, 709.6632690429688, 728.6714477539062, 747.6796264648438, 766.687744140625, 785.6959228515625, 804.7041015625, 823.7122192382812]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 2.0, 8.0, 9.0, 11.0, 11.0, 17.0, 17.0, 22.0, 29.0, 13.0, 31.0, 30.0, 30.0, 38.0, 44.0, 41.0, 46.0, 36.0, 51.0, 42.0, 44.0, 49.0, 33.0, 52.0, 36.0, 39.0, 32.0, 25.0, 20.0, 26.0, 21.0, 20.0, 14.0, 13.0, 12.0, 9.0, 4.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-320.2158508300781, -309.3950500488281, -298.57427978515625, -287.75347900390625, -276.93267822265625, -266.11187744140625, -255.2910919189453, -244.47030639648438, -233.64950561523438, -222.82870483398438, -212.00791931152344, -201.1871337890625, -190.3663330078125, -179.5455322265625, -168.72474670410156, -157.90396118164062, -147.08316040039062, -136.26235961914062, -125.44157409667969, -114.62078094482422, -103.79998779296875, -92.97919464111328, -82.15840148925781, -71.33760833740234, -60.516815185546875, -49.696022033691406, -38.87522888183594, -28.05443572998047, -17.233642578125, -6.412849426269531, 4.4079437255859375, 15.228736877441406, 26.049560546875, 36.87035369873047, 47.69114685058594, 58.511940002441406, 69.33273315429688, 80.15352630615234, 90.97431945800781, 101.79511260986328, 112.61590576171875, 123.43669891357422, 134.2574920654297, 145.07827758789062, 155.89907836914062, 166.71987915039062, 177.54066467285156, 188.3614501953125, 199.1822509765625, 210.0030517578125, 220.82383728027344, 231.64462280273438, 242.46542358398438, 253.28622436523438, 264.10699462890625, 274.92779541015625, 285.74859619140625, 296.56939697265625, 307.39019775390625, 318.2109680175781, 329.0317687988281, 339.8525695800781, 350.67333984375, 361.494140625, 372.31494140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 18.0, 9.0, 16.0, 18.0, 37.0, 39.0, 69.0, 111.0, 158.0, 223.0, 382.0, 528.0, 934.0, 1588.0, 2943.0, 5377.0, 11101.0, 25030.0, 63904.0, 186270.0, 446536.0, 189974.0, 64009.0, 25402.0, 11251.0, 5460.0, 2900.0, 1689.0, 941.0, 571.0, 337.0, 238.0, 121.0, 102.0, 68.0, 53.0, 24.0, 35.0, 15.0, 17.0, 10.0, 4.0, 9.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-70.1875, -68.0283203125, -65.869140625, -63.7099609375, -61.55078125, -59.3916015625, -57.232421875, -55.0732421875, -52.9140625, -50.7548828125, -48.595703125, -46.4365234375, -44.27734375, -42.1181640625, -39.958984375, -37.7998046875, -35.640625, -33.4814453125, -31.322265625, -29.1630859375, -27.00390625, -24.8447265625, -22.685546875, -20.5263671875, -18.3671875, -16.2080078125, -14.048828125, -11.8896484375, -9.73046875, -7.5712890625, -5.412109375, -3.2529296875, -1.09375, 1.0654296875, 3.224609375, 5.3837890625, 7.54296875, 9.7021484375, 11.861328125, 14.0205078125, 16.1796875, 18.3388671875, 20.498046875, 22.6572265625, 24.81640625, 26.9755859375, 29.134765625, 31.2939453125, 33.453125, 35.6123046875, 37.771484375, 39.9306640625, 42.08984375, 44.2490234375, 46.408203125, 48.5673828125, 50.7265625, 52.8857421875, 55.044921875, 57.2041015625, 59.36328125, 61.5224609375, 63.681640625, 65.8408203125, 68.0]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 9.0, 14.0, 16.0, 12.0, 12.0, 19.0, 16.0, 25.0, 29.0, 24.0, 34.0, 34.0, 37.0, 37.0, 37.0, 52.0, 39.0, 50.0, 57.0, 39.0, 52.0, 47.0, 48.0, 40.0, 24.0, 34.0, 21.0, 25.0, 12.0, 25.0, 9.0, 13.0, 15.0, 9.0, 4.0, 4.0, 6.0, 2.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.542236328125, -29.47509765625, -28.407958984375, -27.3408203125, -26.273681640625, -25.20654296875, -24.139404296875, -23.072265625, -22.005126953125, -20.93798828125, -19.870849609375, -18.8037109375, -17.736572265625, -16.66943359375, -15.602294921875, -14.53515625, -13.468017578125, -12.40087890625, -11.333740234375, -10.2666015625, -9.199462890625, -8.13232421875, -7.065185546875, -5.998046875, -4.930908203125, -3.86376953125, -2.796630859375, -1.7294921875, -0.662353515625, 0.40478515625, 1.471923828125, 2.5390625, 3.606201171875, 4.67333984375, 5.740478515625, 6.8076171875, 7.874755859375, 8.94189453125, 10.009033203125, 11.076171875, 12.143310546875, 13.21044921875, 14.277587890625, 15.3447265625, 16.411865234375, 17.47900390625, 18.546142578125, 19.61328125, 20.680419921875, 21.74755859375, 22.814697265625, 23.8818359375, 24.948974609375, 26.01611328125, 27.083251953125, 28.150390625, 29.217529296875, 30.28466796875, 31.351806640625, 32.4189453125, 33.486083984375, 34.55322265625, 35.620361328125, 36.6875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 16.0, 17.0, 21.0, 30.0, 54.0, 79.0, 112.0, 196.0, 361.0, 715.0, 1601.0, 4388.0, 16287.0, 90939.0, 754227.0, 147165.0, 22667.0, 5823.0, 2027.0, 840.0, 400.0, 208.0, 137.0, 76.0, 44.0, 29.0, 26.0, 7.0, 17.0, 13.0, 3.0, 9.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.25, -134.3828125, -129.515625, -124.6484375, -119.78125, -114.9140625, -110.046875, -105.1796875, -100.3125, -95.4453125, -90.578125, -85.7109375, -80.84375, -75.9765625, -71.109375, -66.2421875, -61.375, -56.5078125, -51.640625, -46.7734375, -41.90625, -37.0390625, -32.171875, -27.3046875, -22.4375, -17.5703125, -12.703125, -7.8359375, -2.96875, 1.8984375, 6.765625, 11.6328125, 16.5, 21.3671875, 26.234375, 31.1015625, 35.96875, 40.8359375, 45.703125, 50.5703125, 55.4375, 60.3046875, 65.171875, 70.0390625, 74.90625, 79.7734375, 84.640625, 89.5078125, 94.375, 99.2421875, 104.109375, 108.9765625, 113.84375, 118.7109375, 123.578125, 128.4453125, 133.3125, 138.1796875, 143.046875, 147.9140625, 152.78125, 157.6484375, 162.515625, 167.3828125, 172.25]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 4.0, 8.0, 12.0, 9.0, 11.0, 14.0, 15.0, 25.0, 20.0, 34.0, 30.0, 52.0, 48.0, 43.0, 38.0, 43.0, 48.0, 52.0, 57.0, 63.0, 50.0, 42.0, 44.0, 45.0, 33.0, 28.0, 24.0, 23.0, 18.0, 12.0, 12.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.25, -158.201171875, -153.15234375, -148.103515625, -143.0546875, -138.005859375, -132.95703125, -127.908203125, -122.859375, -117.810546875, -112.76171875, -107.712890625, -102.6640625, -97.615234375, -92.56640625, -87.517578125, -82.46875, -77.419921875, -72.37109375, -67.322265625, -62.2734375, -57.224609375, -52.17578125, -47.126953125, -42.078125, -37.029296875, -31.98046875, -26.931640625, -21.8828125, -16.833984375, -11.78515625, -6.736328125, -1.6875, 3.361328125, 8.41015625, 13.458984375, 18.5078125, 23.556640625, 28.60546875, 33.654296875, 38.703125, 43.751953125, 48.80078125, 53.849609375, 58.8984375, 63.947265625, 68.99609375, 74.044921875, 79.09375, 84.142578125, 89.19140625, 94.240234375, 99.2890625, 104.337890625, 109.38671875, 114.435546875, 119.484375, 124.533203125, 129.58203125, 134.630859375, 139.6796875, 144.728515625, 149.77734375, 154.826171875, 159.875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 11.0, 16.0, 24.0, 28.0, 58.0, 75.0, 122.0, 223.0, 394.0, 691.0, 1554.0, 3915.0, 12000.0, 61114.0, 719539.0, 211415.0, 25690.0, 6857.0, 2371.0, 1126.0, 533.0, 334.0, 172.0, 110.0, 57.0, 32.0, 20.0, 13.0, 12.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-79.875, -77.5771484375, -75.279296875, -72.9814453125, -70.68359375, -68.3857421875, -66.087890625, -63.7900390625, -61.4921875, -59.1943359375, -56.896484375, -54.5986328125, -52.30078125, -50.0029296875, -47.705078125, -45.4072265625, -43.109375, -40.8115234375, -38.513671875, -36.2158203125, -33.91796875, -31.6201171875, -29.322265625, -27.0244140625, -24.7265625, -22.4287109375, -20.130859375, -17.8330078125, -15.53515625, -13.2373046875, -10.939453125, -8.6416015625, -6.34375, -4.0458984375, -1.748046875, 0.5498046875, 2.84765625, 5.1455078125, 7.443359375, 9.7412109375, 12.0390625, 14.3369140625, 16.634765625, 18.9326171875, 21.23046875, 23.5283203125, 25.826171875, 28.1240234375, 30.421875, 32.7197265625, 35.017578125, 37.3154296875, 39.61328125, 41.9111328125, 44.208984375, 46.5068359375, 48.8046875, 51.1025390625, 53.400390625, 55.6982421875, 57.99609375, 60.2939453125, 62.591796875, 64.8896484375, 67.1875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 13.0, 24.0, 50.0, 91.0, 247.0, 291.0, 128.0, 50.0, 31.0, 17.0, 15.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.054443359375, -0.053238868713378906, -0.05203437805175781, -0.05082988739013672, -0.049625396728515625, -0.04842090606689453, -0.04721641540527344, -0.046011924743652344, -0.04480743408203125, -0.043602943420410156, -0.04239845275878906, -0.04119396209716797, -0.039989471435546875, -0.03878498077392578, -0.03758049011230469, -0.036375999450683594, -0.0351715087890625, -0.033967018127441406, -0.03276252746582031, -0.03155803680419922, -0.030353546142578125, -0.02914905548095703, -0.027944564819335938, -0.026740074157714844, -0.02553558349609375, -0.024331092834472656, -0.023126602172851562, -0.02192211151123047, -0.020717620849609375, -0.01951313018798828, -0.018308639526367188, -0.017104148864746094, -0.015899658203125, -0.014695167541503906, -0.013490676879882812, -0.012286186218261719, -0.011081695556640625, -0.009877204895019531, -0.008672714233398438, -0.007468223571777344, -0.00626373291015625, -0.005059242248535156, -0.0038547515869140625, -0.0026502609252929688, -0.001445770263671875, -0.00024127960205078125, 0.0009632110595703125, 0.0021677017211914062, 0.0033721923828125, 0.004576683044433594, 0.0057811737060546875, 0.006985664367675781, 0.008190155029296875, 0.009394645690917969, 0.010599136352539062, 0.011803627014160156, 0.01300811767578125, 0.014212608337402344, 0.015417098999023438, 0.01662158966064453, 0.017826080322265625, 0.01903057098388672, 0.020235061645507812, 0.021439552307128906, 0.02264404296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 15.0, 24.0, 22.0, 41.0, 78.0, 107.0, 172.0, 365.0, 668.0, 1350.0, 3169.0, 8856.0, 35408.0, 241637.0, 650614.0, 80703.0, 16169.0, 5056.0, 2012.0, 971.0, 439.0, 253.0, 154.0, 74.0, 54.0, 28.0, 18.0, 20.0, 18.0, 11.0, 4.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.25, -50.52197265625, -48.7939453125, -47.06591796875, -45.337890625, -43.60986328125, -41.8818359375, -40.15380859375, -38.42578125, -36.69775390625, -34.9697265625, -33.24169921875, -31.513671875, -29.78564453125, -28.0576171875, -26.32958984375, -24.6015625, -22.87353515625, -21.1455078125, -19.41748046875, -17.689453125, -15.96142578125, -14.2333984375, -12.50537109375, -10.77734375, -9.04931640625, -7.3212890625, -5.59326171875, -3.865234375, -2.13720703125, -0.4091796875, 1.31884765625, 3.046875, 4.77490234375, 6.5029296875, 8.23095703125, 9.958984375, 11.68701171875, 13.4150390625, 15.14306640625, 16.87109375, 18.59912109375, 20.3271484375, 22.05517578125, 23.783203125, 25.51123046875, 27.2392578125, 28.96728515625, 30.6953125, 32.42333984375, 34.1513671875, 35.87939453125, 37.607421875, 39.33544921875, 41.0634765625, 42.79150390625, 44.51953125, 46.24755859375, 47.9755859375, 49.70361328125, 51.431640625, 53.15966796875, 54.8876953125, 56.61572265625, 58.34375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 5.0, 11.0, 17.0, 13.0, 32.0, 48.0, 43.0, 79.0, 65.0, 98.0, 108.0, 92.0, 91.0, 67.0, 66.0, 36.0, 25.0, 17.0, 15.0, 20.0, 9.0, 3.0, 9.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.0625, -60.15234375, -58.2421875, -56.33203125, -54.421875, -52.51171875, -50.6015625, -48.69140625, -46.78125, -44.87109375, -42.9609375, -41.05078125, -39.140625, -37.23046875, -35.3203125, -33.41015625, -31.5, -29.58984375, -27.6796875, -25.76953125, -23.859375, -21.94921875, -20.0390625, -18.12890625, -16.21875, -14.30859375, -12.3984375, -10.48828125, -8.578125, -6.66796875, -4.7578125, -2.84765625, -0.9375, 0.97265625, 2.8828125, 4.79296875, 6.703125, 8.61328125, 10.5234375, 12.43359375, 14.34375, 16.25390625, 18.1640625, 20.07421875, 21.984375, 23.89453125, 25.8046875, 27.71484375, 29.625, 31.53515625, 33.4453125, 35.35546875, 37.265625, 39.17578125, 41.0859375, 42.99609375, 44.90625, 46.81640625, 48.7265625, 50.63671875, 52.546875, 54.45703125, 56.3671875, 58.27734375, 60.1875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 21.0, 64.0, 191.0, 314.0, 216.0, 108.0, 40.0, 19.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1606.042724609375, -1551.7738037109375, -1497.5048828125, -1443.2359619140625, -1388.967041015625, -1334.6981201171875, -1280.42919921875, -1226.1602783203125, -1171.891357421875, -1117.6224365234375, -1063.353515625, -1009.0845947265625, -954.815673828125, -900.5467529296875, -846.27783203125, -792.0089111328125, -737.739990234375, -683.4710693359375, -629.2021484375, -574.9332275390625, -520.664306640625, -466.3953857421875, -412.12646484375, -357.8575439453125, -303.588623046875, -249.3197021484375, -195.05078125, -140.7818603515625, -86.512939453125, -32.2440185546875, 22.02490234375, 76.2938232421875, 130.5628662109375, 184.831787109375, 239.1007080078125, 293.36962890625, 347.6385498046875, 401.907470703125, 456.1763916015625, 510.4453125, 564.7142333984375, 618.983154296875, 673.2520751953125, 727.52099609375, 781.7899169921875, 836.058837890625, 890.3277587890625, 944.5966796875, 998.8656005859375, 1053.134521484375, 1107.4034423828125, 1161.67236328125, 1215.9412841796875, 1270.210205078125, 1324.4791259765625, 1378.748046875, 1433.0169677734375, 1487.285888671875, 1541.5548095703125, 1595.82373046875, 1650.0926513671875, 1704.361572265625, 1758.6304931640625, 1812.8994140625, 1867.1683349609375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 11.0, 7.0, 6.0, 15.0, 10.0, 17.0, 13.0, 20.0, 22.0, 31.0, 20.0, 29.0, 38.0, 27.0, 42.0, 42.0, 37.0, 41.0, 59.0, 52.0, 49.0, 32.0, 39.0, 39.0, 38.0, 34.0, 29.0, 21.0, 31.0, 20.0, 16.0, 18.0, 15.0, 12.0, 20.0, 8.0, 8.0, 11.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-614.193115234375, -596.7333374023438, -579.2735595703125, -561.8137817382812, -544.35400390625, -526.8941650390625, -509.43438720703125, -491.974609375, -474.51483154296875, -457.0550537109375, -439.59527587890625, -422.1354675292969, -404.6756896972656, -387.2159118652344, -369.756103515625, -352.29632568359375, -334.8365478515625, -317.37677001953125, -299.9169921875, -282.4571838378906, -264.9974060058594, -247.53762817382812, -230.0778350830078, -212.6180419921875, -195.15826416015625, -177.698486328125, -160.2386932373047, -142.77890014648438, -125.31912231445312, -107.85933685302734, -90.39955139160156, -72.93976593017578, -55.47998046875, -38.02019500732422, -20.560409545898438, -3.1006240844726562, 14.359161376953125, 31.818946838378906, 49.27873229980469, 66.73851776123047, 84.19830322265625, 101.65808868408203, 119.11787414550781, 136.57766723632812, 154.03744506835938, 171.49722290039062, 188.95701599121094, 206.41680908203125, 223.8765869140625, 241.33636474609375, 258.796142578125, 276.2559509277344, 293.7157287597656, 311.1755065917969, 328.63531494140625, 346.0950927734375, 363.55487060546875, 381.0146484375, 398.47442626953125, 415.9342346191406, 433.3940124511719, 450.8537902832031, 468.3135986328125, 485.77337646484375, 503.233154296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 7.0, 9.0, 6.0, 7.0, 19.0, 21.0, 25.0, 44.0, 60.0, 80.0, 107.0, 156.0, 262.0, 406.0, 633.0, 1064.0, 1674.0, 3061.0, 5722.0, 11498.0, 26539.0, 83376.0, 341821.0, 1637369.0, 1615702.0, 337040.0, 79085.0, 25243.0, 10819.0, 5333.0, 2781.0, 1573.0, 938.0, 618.0, 404.0, 215.0, 151.0, 105.0, 82.0, 65.0, 47.0, 36.0, 18.0, 23.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 1.0], "bins": [-42.125, -40.80810546875, -39.4912109375, -38.17431640625, -36.857421875, -35.54052734375, -34.2236328125, -32.90673828125, -31.58984375, -30.27294921875, -28.9560546875, -27.63916015625, -26.322265625, -25.00537109375, -23.6884765625, -22.37158203125, -21.0546875, -19.73779296875, -18.4208984375, -17.10400390625, -15.787109375, -14.47021484375, -13.1533203125, -11.83642578125, -10.51953125, -9.20263671875, -7.8857421875, -6.56884765625, -5.251953125, -3.93505859375, -2.6181640625, -1.30126953125, 0.015625, 1.33251953125, 2.6494140625, 3.96630859375, 5.283203125, 6.60009765625, 7.9169921875, 9.23388671875, 10.55078125, 11.86767578125, 13.1845703125, 14.50146484375, 15.818359375, 17.13525390625, 18.4521484375, 19.76904296875, 21.0859375, 22.40283203125, 23.7197265625, 25.03662109375, 26.353515625, 27.67041015625, 28.9873046875, 30.30419921875, 31.62109375, 32.93798828125, 34.2548828125, 35.57177734375, 36.888671875, 38.20556640625, 39.5224609375, 40.83935546875, 42.15625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 3.0, 6.0, 6.0, 12.0, 18.0, 20.0, 15.0, 26.0, 18.0, 39.0, 22.0, 31.0, 38.0, 32.0, 64.0, 44.0, 45.0, 59.0, 60.0, 44.0, 49.0, 48.0, 50.0, 36.0, 38.0, 25.0, 20.0, 23.0, 13.0, 15.0, 16.0, 17.0, 8.0, 10.0, 7.0, 4.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.859375, -26.784912109375, -25.71044921875, -24.635986328125, -23.5615234375, -22.487060546875, -21.41259765625, -20.338134765625, -19.263671875, -18.189208984375, -17.11474609375, -16.040283203125, -14.9658203125, -13.891357421875, -12.81689453125, -11.742431640625, -10.66796875, -9.593505859375, -8.51904296875, -7.444580078125, -6.3701171875, -5.295654296875, -4.22119140625, -3.146728515625, -2.072265625, -0.997802734375, 0.07666015625, 1.151123046875, 2.2255859375, 3.300048828125, 4.37451171875, 5.448974609375, 6.5234375, 7.597900390625, 8.67236328125, 9.746826171875, 10.8212890625, 11.895751953125, 12.97021484375, 14.044677734375, 15.119140625, 16.193603515625, 17.26806640625, 18.342529296875, 19.4169921875, 20.491455078125, 21.56591796875, 22.640380859375, 23.71484375, 24.789306640625, 25.86376953125, 26.938232421875, 28.0126953125, 29.087158203125, 30.16162109375, 31.236083984375, 32.310546875, 33.385009765625, 34.45947265625, 35.533935546875, 36.6083984375, 37.682861328125, 38.75732421875, 39.831787109375, 40.90625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 5.0, 9.0, 9.0, 18.0, 31.0, 29.0, 72.0, 75.0, 119.0, 190.0, 308.0, 521.0, 940.0, 1683.0, 3561.0, 8626.0, 26466.0, 109246.0, 1789763.0, 2092117.0, 118253.0, 26661.0, 8451.0, 3434.0, 1606.0, 804.0, 471.0, 279.0, 157.0, 124.0, 85.0, 39.0, 46.0, 19.0, 15.0, 10.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-102.9375, -99.72265625, -96.5078125, -93.29296875, -90.078125, -86.86328125, -83.6484375, -80.43359375, -77.21875, -74.00390625, -70.7890625, -67.57421875, -64.359375, -61.14453125, -57.9296875, -54.71484375, -51.5, -48.28515625, -45.0703125, -41.85546875, -38.640625, -35.42578125, -32.2109375, -28.99609375, -25.78125, -22.56640625, -19.3515625, -16.13671875, -12.921875, -9.70703125, -6.4921875, -3.27734375, -0.0625, 3.15234375, 6.3671875, 9.58203125, 12.796875, 16.01171875, 19.2265625, 22.44140625, 25.65625, 28.87109375, 32.0859375, 35.30078125, 38.515625, 41.73046875, 44.9453125, 48.16015625, 51.375, 54.58984375, 57.8046875, 61.01953125, 64.234375, 67.44921875, 70.6640625, 73.87890625, 77.09375, 80.30859375, 83.5234375, 86.73828125, 89.953125, 93.16796875, 96.3828125, 99.59765625, 102.8125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 11.0, 9.0, 21.0, 28.0, 31.0, 53.0, 72.0, 75.0, 164.0, 383.0, 800.0, 1065.0, 599.0, 291.0, 159.0, 89.0, 74.0, 38.0, 25.0, 19.0, 16.0, 6.0, 8.0, 11.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-142.5, -138.08984375, -133.6796875, -129.26953125, -124.859375, -120.44921875, -116.0390625, -111.62890625, -107.21875, -102.80859375, -98.3984375, -93.98828125, -89.578125, -85.16796875, -80.7578125, -76.34765625, -71.9375, -67.52734375, -63.1171875, -58.70703125, -54.296875, -49.88671875, -45.4765625, -41.06640625, -36.65625, -32.24609375, -27.8359375, -23.42578125, -19.015625, -14.60546875, -10.1953125, -5.78515625, -1.375, 3.03515625, 7.4453125, 11.85546875, 16.265625, 20.67578125, 25.0859375, 29.49609375, 33.90625, 38.31640625, 42.7265625, 47.13671875, 51.546875, 55.95703125, 60.3671875, 64.77734375, 69.1875, 73.59765625, 78.0078125, 82.41796875, 86.828125, 91.23828125, 95.6484375, 100.05859375, 104.46875, 108.87890625, 113.2890625, 117.69921875, 122.109375, 126.51953125, 130.9296875, 135.33984375, 139.75]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 14.0, 14.0, 30.0, 91.0, 173.0, 246.0, 216.0, 128.0, 40.0, 26.0, 10.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2329.535888671875, -2277.539794921875, -2225.54345703125, -2173.54736328125, -2121.55126953125, -2069.554931640625, -2017.558837890625, -1965.5626220703125, -1913.56640625, -1861.5701904296875, -1809.5740966796875, -1757.577880859375, -1705.5816650390625, -1653.58544921875, -1601.58935546875, -1549.5931396484375, -1497.5970458984375, -1445.600830078125, -1393.604736328125, -1341.6085205078125, -1289.6123046875, -1237.6162109375, -1185.6199951171875, -1133.623779296875, -1081.627685546875, -1029.6314697265625, -977.6353149414062, -925.63916015625, -873.6429443359375, -821.6467895507812, -769.650634765625, -717.6544189453125, -665.6580810546875, -613.6619262695312, -561.6657104492188, -509.6695556640625, -457.6733703613281, -405.67718505859375, -353.6810302734375, -301.6848449707031, -249.68865966796875, -197.69247436523438, -145.69630432128906, -93.70013427734375, -41.703948974609375, 10.292236328125, 62.28839111328125, 114.28457641601562, 166.28076171875, 218.27694702148438, 270.27313232421875, 322.269287109375, 374.2654724121094, 426.26165771484375, 478.2578125, 530.2540283203125, 582.2501831054688, 634.246337890625, 686.2425537109375, 738.2387084960938, 790.23486328125, 842.2310791015625, 894.2272338867188, 946.223388671875, 998.2196044921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 13.0, 9.0, 7.0, 6.0, 15.0, 20.0, 30.0, 23.0, 26.0, 31.0, 33.0, 34.0, 44.0, 41.0, 62.0, 55.0, 64.0, 39.0, 57.0, 31.0, 52.0, 34.0, 33.0, 41.0, 29.0, 32.0, 23.0, 22.0, 22.0, 17.0, 14.0, 5.0, 12.0, 5.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-600.299560546875, -582.5486450195312, -564.7977294921875, -547.0468139648438, -529.2958984375, -511.54498291015625, -493.7940673828125, -476.04315185546875, -458.292236328125, -440.54132080078125, -422.7904052734375, -405.03948974609375, -387.28857421875, -369.53765869140625, -351.7867431640625, -334.03582763671875, -316.2848815917969, -298.5339660644531, -280.7830505371094, -263.0321350097656, -245.28121948242188, -227.53030395507812, -209.7793731689453, -192.02845764160156, -174.2775421142578, -156.52662658691406, -138.7757110595703, -121.02478790283203, -103.27387237548828, -85.52295684814453, -67.77203369140625, -50.0211181640625, -32.27020263671875, -14.519285202026367, 3.2316322326660156, 20.98255157470703, 38.73346710205078, 56.48438262939453, 74.23530578613281, 91.98622131347656, 109.73713684082031, 127.48805236816406, 145.2389678955078, 162.98989868164062, 180.74081420898438, 198.49172973632812, 216.24264526367188, 233.99356079101562, 251.74447631835938, 269.4953918457031, 287.2463073730469, 304.9972229003906, 322.7481384277344, 340.4990539550781, 358.25, 376.00091552734375, 393.7518310546875, 411.50274658203125, 429.253662109375, 447.00457763671875, 464.7554931640625, 482.50640869140625, 500.25732421875, 518.0082397460938, 535.7591552734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 12.0, 17.0, 14.0, 30.0, 49.0, 60.0, 92.0, 118.0, 166.0, 324.0, 546.0, 795.0, 1369.0, 2291.0, 3907.0, 6995.0, 12940.0, 25408.0, 50653.0, 106499.0, 238442.0, 313772.0, 145050.0, 67864.0, 33471.0, 16497.0, 9029.0, 5049.0, 2811.0, 1649.0, 953.0, 635.0, 332.0, 257.0, 139.0, 104.0, 54.0, 47.0, 36.0, 34.0, 12.0, 11.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.875, -54.083984375, -52.29296875, -50.501953125, -48.7109375, -46.919921875, -45.12890625, -43.337890625, -41.546875, -39.755859375, -37.96484375, -36.173828125, -34.3828125, -32.591796875, -30.80078125, -29.009765625, -27.21875, -25.427734375, -23.63671875, -21.845703125, -20.0546875, -18.263671875, -16.47265625, -14.681640625, -12.890625, -11.099609375, -9.30859375, -7.517578125, -5.7265625, -3.935546875, -2.14453125, -0.353515625, 1.4375, 3.228515625, 5.01953125, 6.810546875, 8.6015625, 10.392578125, 12.18359375, 13.974609375, 15.765625, 17.556640625, 19.34765625, 21.138671875, 22.9296875, 24.720703125, 26.51171875, 28.302734375, 30.09375, 31.884765625, 33.67578125, 35.466796875, 37.2578125, 39.048828125, 40.83984375, 42.630859375, 44.421875, 46.212890625, 48.00390625, 49.794921875, 51.5859375, 53.376953125, 55.16796875, 56.958984375, 58.75]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 7.0, 13.0, 11.0, 13.0, 15.0, 20.0, 28.0, 24.0, 34.0, 41.0, 42.0, 49.0, 57.0, 52.0, 54.0, 50.0, 50.0, 57.0, 44.0, 57.0, 39.0, 27.0, 35.0, 35.0, 28.0, 13.0, 24.0, 17.0, 11.0, 12.0, 11.0, 9.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.5625, -47.31103515625, -46.0595703125, -44.80810546875, -43.556640625, -42.30517578125, -41.0537109375, -39.80224609375, -38.55078125, -37.29931640625, -36.0478515625, -34.79638671875, -33.544921875, -32.29345703125, -31.0419921875, -29.79052734375, -28.5390625, -27.28759765625, -26.0361328125, -24.78466796875, -23.533203125, -22.28173828125, -21.0302734375, -19.77880859375, -18.52734375, -17.27587890625, -16.0244140625, -14.77294921875, -13.521484375, -12.27001953125, -11.0185546875, -9.76708984375, -8.515625, -7.26416015625, -6.0126953125, -4.76123046875, -3.509765625, -2.25830078125, -1.0068359375, 0.24462890625, 1.49609375, 2.74755859375, 3.9990234375, 5.25048828125, 6.501953125, 7.75341796875, 9.0048828125, 10.25634765625, 11.5078125, 12.75927734375, 14.0107421875, 15.26220703125, 16.513671875, 17.76513671875, 19.0166015625, 20.26806640625, 21.51953125, 22.77099609375, 24.0224609375, 25.27392578125, 26.525390625, 27.77685546875, 29.0283203125, 30.27978515625, 31.53125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 13.0, 11.0, 13.0, 22.0, 52.0, 38.0, 64.0, 100.0, 165.0, 239.0, 413.0, 740.0, 1487.0, 3644.0, 12819.0, 96721.0, 809573.0, 102051.0, 13321.0, 3666.0, 1458.0, 720.0, 419.0, 281.0, 158.0, 108.0, 70.0, 57.0, 37.0, 18.0, 18.0, 20.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-254.75, -248.134765625, -241.51953125, -234.904296875, -228.2890625, -221.673828125, -215.05859375, -208.443359375, -201.828125, -195.212890625, -188.59765625, -181.982421875, -175.3671875, -168.751953125, -162.13671875, -155.521484375, -148.90625, -142.291015625, -135.67578125, -129.060546875, -122.4453125, -115.830078125, -109.21484375, -102.599609375, -95.984375, -89.369140625, -82.75390625, -76.138671875, -69.5234375, -62.908203125, -56.29296875, -49.677734375, -43.0625, -36.447265625, -29.83203125, -23.216796875, -16.6015625, -9.986328125, -3.37109375, 3.244140625, 9.859375, 16.474609375, 23.08984375, 29.705078125, 36.3203125, 42.935546875, 49.55078125, 56.166015625, 62.78125, 69.396484375, 76.01171875, 82.626953125, 89.2421875, 95.857421875, 102.47265625, 109.087890625, 115.703125, 122.318359375, 128.93359375, 135.548828125, 142.1640625, 148.779296875, 155.39453125, 162.009765625, 168.625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 4.0, 14.0, 16.0, 22.0, 24.0, 19.0, 24.0, 45.0, 40.0, 47.0, 46.0, 58.0, 65.0, 66.0, 56.0, 52.0, 61.0, 32.0, 42.0, 42.0, 32.0, 38.0, 27.0, 27.0, 21.0, 15.0, 15.0, 11.0, 9.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-266.25, -259.634765625, -253.01953125, -246.404296875, -239.7890625, -233.173828125, -226.55859375, -219.943359375, -213.328125, -206.712890625, -200.09765625, -193.482421875, -186.8671875, -180.251953125, -173.63671875, -167.021484375, -160.40625, -153.791015625, -147.17578125, -140.560546875, -133.9453125, -127.330078125, -120.71484375, -114.099609375, -107.484375, -100.869140625, -94.25390625, -87.638671875, -81.0234375, -74.408203125, -67.79296875, -61.177734375, -54.5625, -47.947265625, -41.33203125, -34.716796875, -28.1015625, -21.486328125, -14.87109375, -8.255859375, -1.640625, 4.974609375, 11.58984375, 18.205078125, 24.8203125, 31.435546875, 38.05078125, 44.666015625, 51.28125, 57.896484375, 64.51171875, 71.126953125, 77.7421875, 84.357421875, 90.97265625, 97.587890625, 104.203125, 110.818359375, 117.43359375, 124.048828125, 130.6640625, 137.279296875, 143.89453125, 150.509765625, 157.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 6.0, 12.0, 11.0, 22.0, 29.0, 34.0, 62.0, 103.0, 184.0, 314.0, 617.0, 1452.0, 3601.0, 10910.0, 43443.0, 256964.0, 628947.0, 75842.0, 17024.0, 5188.0, 1950.0, 816.0, 424.0, 218.0, 123.0, 87.0, 45.0, 49.0, 24.0, 11.0, 10.0, 10.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.28125, -33.82177734375, -32.3623046875, -30.90283203125, -29.443359375, -27.98388671875, -26.5244140625, -25.06494140625, -23.60546875, -22.14599609375, -20.6865234375, -19.22705078125, -17.767578125, -16.30810546875, -14.8486328125, -13.38916015625, -11.9296875, -10.47021484375, -9.0107421875, -7.55126953125, -6.091796875, -4.63232421875, -3.1728515625, -1.71337890625, -0.25390625, 1.20556640625, 2.6650390625, 4.12451171875, 5.583984375, 7.04345703125, 8.5029296875, 9.96240234375, 11.421875, 12.88134765625, 14.3408203125, 15.80029296875, 17.259765625, 18.71923828125, 20.1787109375, 21.63818359375, 23.09765625, 24.55712890625, 26.0166015625, 27.47607421875, 28.935546875, 30.39501953125, 31.8544921875, 33.31396484375, 34.7734375, 36.23291015625, 37.6923828125, 39.15185546875, 40.611328125, 42.07080078125, 43.5302734375, 44.98974609375, 46.44921875, 47.90869140625, 49.3681640625, 50.82763671875, 52.287109375, 53.74658203125, 55.2060546875, 56.66552734375, 58.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 25.0, 24.0, 28.0, 33.0, 40.0, 57.0, 84.0, 91.0, 121.0, 98.0, 88.0, 57.0, 51.0, 32.0, 34.0, 18.0, 16.0, 15.0, 10.0, 7.0, 7.0, 8.0, 3.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017974853515625, -0.017531633377075195, -0.01708841323852539, -0.016645193099975586, -0.01620197296142578, -0.015758752822875977, -0.015315532684326172, -0.014872312545776367, -0.014429092407226562, -0.013985872268676758, -0.013542652130126953, -0.013099431991577148, -0.012656211853027344, -0.012212991714477539, -0.011769771575927734, -0.01132655143737793, -0.010883331298828125, -0.01044011116027832, -0.009996891021728516, -0.009553670883178711, -0.009110450744628906, -0.008667230606079102, -0.008224010467529297, -0.007780790328979492, -0.0073375701904296875, -0.006894350051879883, -0.006451129913330078, -0.0060079097747802734, -0.005564689636230469, -0.005121469497680664, -0.004678249359130859, -0.004235029220581055, -0.00379180908203125, -0.0033485889434814453, -0.0029053688049316406, -0.002462148666381836, -0.0020189285278320312, -0.0015757083892822266, -0.0011324882507324219, -0.0006892681121826172, -0.0002460479736328125, 0.0001971721649169922, 0.0006403923034667969, 0.0010836124420166016, 0.0015268325805664062, 0.001970052719116211, 0.0024132728576660156, 0.0028564929962158203, 0.003299713134765625, 0.0037429332733154297, 0.004186153411865234, 0.004629373550415039, 0.005072593688964844, 0.0055158138275146484, 0.005959033966064453, 0.006402254104614258, 0.0068454742431640625, 0.007288694381713867, 0.007731914520263672, 0.008175134658813477, 0.008618354797363281, 0.009061574935913086, 0.00950479507446289, 0.009948015213012695, 0.0103912353515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 14.0, 10.0, 24.0, 27.0, 69.0, 77.0, 131.0, 208.0, 472.0, 994.0, 2513.0, 8960.0, 59805.0, 787034.0, 164473.0, 17237.0, 3867.0, 1355.0, 590.0, 291.0, 147.0, 82.0, 58.0, 34.0, 22.0, 17.0, 9.0, 10.0, 10.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.0625, -74.96240234375, -72.8623046875, -70.76220703125, -68.662109375, -66.56201171875, -64.4619140625, -62.36181640625, -60.26171875, -58.16162109375, -56.0615234375, -53.96142578125, -51.861328125, -49.76123046875, -47.6611328125, -45.56103515625, -43.4609375, -41.36083984375, -39.2607421875, -37.16064453125, -35.060546875, -32.96044921875, -30.8603515625, -28.76025390625, -26.66015625, -24.56005859375, -22.4599609375, -20.35986328125, -18.259765625, -16.15966796875, -14.0595703125, -11.95947265625, -9.859375, -7.75927734375, -5.6591796875, -3.55908203125, -1.458984375, 0.64111328125, 2.7412109375, 4.84130859375, 6.94140625, 9.04150390625, 11.1416015625, 13.24169921875, 15.341796875, 17.44189453125, 19.5419921875, 21.64208984375, 23.7421875, 25.84228515625, 27.9423828125, 30.04248046875, 32.142578125, 34.24267578125, 36.3427734375, 38.44287109375, 40.54296875, 42.64306640625, 44.7431640625, 46.84326171875, 48.943359375, 51.04345703125, 53.1435546875, 55.24365234375, 57.34375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 9.0, 10.0, 16.0, 14.0, 21.0, 21.0, 29.0, 26.0, 39.0, 48.0, 43.0, 37.0, 54.0, 74.0, 76.0, 59.0, 58.0, 54.0, 36.0, 34.0, 30.0, 28.0, 19.0, 25.0, 19.0, 22.0, 5.0, 8.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.5625, -38.36669921875, -37.1708984375, -35.97509765625, -34.779296875, -33.58349609375, -32.3876953125, -31.19189453125, -29.99609375, -28.80029296875, -27.6044921875, -26.40869140625, -25.212890625, -24.01708984375, -22.8212890625, -21.62548828125, -20.4296875, -19.23388671875, -18.0380859375, -16.84228515625, -15.646484375, -14.45068359375, -13.2548828125, -12.05908203125, -10.86328125, -9.66748046875, -8.4716796875, -7.27587890625, -6.080078125, -4.88427734375, -3.6884765625, -2.49267578125, -1.296875, -0.10107421875, 1.0947265625, 2.29052734375, 3.486328125, 4.68212890625, 5.8779296875, 7.07373046875, 8.26953125, 9.46533203125, 10.6611328125, 11.85693359375, 13.052734375, 14.24853515625, 15.4443359375, 16.64013671875, 17.8359375, 19.03173828125, 20.2275390625, 21.42333984375, 22.619140625, 23.81494140625, 25.0107421875, 26.20654296875, 27.40234375, 28.59814453125, 29.7939453125, 30.98974609375, 32.185546875, 33.38134765625, 34.5771484375, 35.77294921875, 36.96875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 13.0, 39.0, 50.0, 150.0, 268.0, 217.0, 139.0, 64.0, 26.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-973.2877197265625, -928.6898803710938, -884.092041015625, -839.4942626953125, -794.8963623046875, -750.298583984375, -705.7007446289062, -661.1029052734375, -616.5050659179688, -571.9072265625, -527.3093872070312, -482.7115783691406, -438.1137390136719, -393.5158996582031, -348.9180908203125, -304.32025146484375, -259.722412109375, -215.12457275390625, -170.52674865722656, -125.92892456054688, -81.33108520507812, -36.733245849609375, 7.86456298828125, 52.46240234375, 97.06024169921875, 141.6580810546875, 186.2559051513672, 230.85372924804688, 275.4515686035156, 320.0494079589844, 364.647216796875, 409.24505615234375, 453.843017578125, 498.44085693359375, 543.0386962890625, 587.636474609375, 632.234375, 676.8321533203125, 721.4299926757812, 766.02783203125, 810.6256713867188, 855.2235107421875, 899.8213500976562, 944.419189453125, 989.0169677734375, 1033.6148681640625, 1078.212646484375, 1122.810546875, 1167.4083251953125, 1212.006103515625, 1256.60400390625, 1301.2017822265625, 1345.7996826171875, 1390.3974609375, 1434.995361328125, 1479.5931396484375, 1524.19091796875, 1568.7886962890625, 1613.3865966796875, 1657.984375, 1702.582275390625, 1747.1800537109375, 1791.77783203125, 1836.375732421875, 1880.9736328125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 7.0, 5.0, 9.0, 6.0, 7.0, 9.0, 13.0, 11.0, 19.0, 14.0, 21.0, 25.0, 28.0, 32.0, 27.0, 26.0, 36.0, 35.0, 48.0, 67.0, 62.0, 69.0, 50.0, 43.0, 51.0, 36.0, 30.0, 26.0, 29.0, 18.0, 21.0, 23.0, 17.0, 15.0, 8.0, 20.0, 11.0, 6.0, 3.0, 3.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-561.072265625, -540.8294067382812, -520.5864868164062, -500.3436279296875, -480.1007385253906, -459.85784912109375, -439.614990234375, -419.3721008300781, -399.12921142578125, -378.8863220214844, -358.6434326171875, -338.40057373046875, -318.1576843261719, -297.914794921875, -277.67193603515625, -257.4290466308594, -237.1861572265625, -216.94326782226562, -196.7003936767578, -176.45751953125, -156.21463012695312, -135.97174072265625, -115.72886657714844, -95.48599243164062, -75.24310302734375, -55.000221252441406, -34.75733947753906, -14.514457702636719, 5.728424072265625, 25.97130584716797, 46.21418762207031, 66.45706176757812, 86.69989013671875, 106.9427719116211, 127.18565368652344, 147.42852783203125, 167.67141723632812, 187.914306640625, 208.1571807861328, 228.40005493164062, 248.6429443359375, 268.8858337402344, 289.12872314453125, 309.37158203125, 329.6144714355469, 349.85736083984375, 370.1002197265625, 390.3431091308594, 410.58599853515625, 430.8288879394531, 451.07177734375, 471.31463623046875, 491.5575256347656, 511.8004150390625, 532.0432739257812, 552.2861328125, 572.529052734375, 592.7719116210938, 613.0148315429688, 633.2576904296875, 653.5006103515625, 673.7434692382812, 693.986328125, 714.229248046875, 734.4721069335938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 10.0, 21.0, 38.0, 53.0, 117.0, 191.0, 393.0, 774.0, 1571.0, 3257.0, 7061.0, 17521.0, 59584.0, 312803.0, 1805955.0, 1642431.0, 263033.0, 51539.0, 15667.0, 6471.0, 2728.0, 1406.0, 691.0, 403.0, 231.0, 124.0, 82.0, 41.0, 26.0, 20.0, 9.0, 11.0, 6.0, 6.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.71875, -31.15771484375, -29.5966796875, -28.03564453125, -26.474609375, -24.91357421875, -23.3525390625, -21.79150390625, -20.23046875, -18.66943359375, -17.1083984375, -15.54736328125, -13.986328125, -12.42529296875, -10.8642578125, -9.30322265625, -7.7421875, -6.18115234375, -4.6201171875, -3.05908203125, -1.498046875, 0.06298828125, 1.6240234375, 3.18505859375, 4.74609375, 6.30712890625, 7.8681640625, 9.42919921875, 10.990234375, 12.55126953125, 14.1123046875, 15.67333984375, 17.234375, 18.79541015625, 20.3564453125, 21.91748046875, 23.478515625, 25.03955078125, 26.6005859375, 28.16162109375, 29.72265625, 31.28369140625, 32.8447265625, 34.40576171875, 35.966796875, 37.52783203125, 39.0888671875, 40.64990234375, 42.2109375, 43.77197265625, 45.3330078125, 46.89404296875, 48.455078125, 50.01611328125, 51.5771484375, 53.13818359375, 54.69921875, 56.26025390625, 57.8212890625, 59.38232421875, 60.943359375, 62.50439453125, 64.0654296875, 65.62646484375, 67.1875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 5.0, 6.0, 17.0, 11.0, 22.0, 39.0, 46.0, 52.0, 62.0, 64.0, 73.0, 87.0, 85.0, 81.0, 65.0, 73.0, 51.0, 49.0, 33.0, 31.0, 9.0, 18.0, 15.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.6875, -41.71484375, -39.7421875, -37.76953125, -35.796875, -33.82421875, -31.8515625, -29.87890625, -27.90625, -25.93359375, -23.9609375, -21.98828125, -20.015625, -18.04296875, -16.0703125, -14.09765625, -12.125, -10.15234375, -8.1796875, -6.20703125, -4.234375, -2.26171875, -0.2890625, 1.68359375, 3.65625, 5.62890625, 7.6015625, 9.57421875, 11.546875, 13.51953125, 15.4921875, 17.46484375, 19.4375, 21.41015625, 23.3828125, 25.35546875, 27.328125, 29.30078125, 31.2734375, 33.24609375, 35.21875, 37.19140625, 39.1640625, 41.13671875, 43.109375, 45.08203125, 47.0546875, 49.02734375, 51.0, 52.97265625, 54.9453125, 56.91796875, 58.890625, 60.86328125, 62.8359375, 64.80859375, 66.78125, 68.75390625, 70.7265625, 72.69921875, 74.671875, 76.64453125, 78.6171875, 80.58984375, 82.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 7.0, 14.0, 19.0, 26.0, 42.0, 75.0, 114.0, 251.0, 429.0, 1048.0, 2956.0, 10096.0, 46659.0, 449647.0, 3437692.0, 203525.0, 29860.0, 7354.0, 2427.0, 1007.0, 428.0, 241.0, 142.0, 85.0, 50.0, 32.0, 20.0, 9.0, 7.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.4375, -106.9169921875, -103.396484375, -99.8759765625, -96.35546875, -92.8349609375, -89.314453125, -85.7939453125, -82.2734375, -78.7529296875, -75.232421875, -71.7119140625, -68.19140625, -64.6708984375, -61.150390625, -57.6298828125, -54.109375, -50.5888671875, -47.068359375, -43.5478515625, -40.02734375, -36.5068359375, -32.986328125, -29.4658203125, -25.9453125, -22.4248046875, -18.904296875, -15.3837890625, -11.86328125, -8.3427734375, -4.822265625, -1.3017578125, 2.21875, 5.7392578125, 9.259765625, 12.7802734375, 16.30078125, 19.8212890625, 23.341796875, 26.8623046875, 30.3828125, 33.9033203125, 37.423828125, 40.9443359375, 44.46484375, 47.9853515625, 51.505859375, 55.0263671875, 58.546875, 62.0673828125, 65.587890625, 69.1083984375, 72.62890625, 76.1494140625, 79.669921875, 83.1904296875, 86.7109375, 90.2314453125, 93.751953125, 97.2724609375, 100.79296875, 104.3134765625, 107.833984375, 111.3544921875, 114.875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 8.0, 8.0, 5.0, 9.0, 19.0, 21.0, 25.0, 28.0, 47.0, 51.0, 59.0, 100.0, 156.0, 253.0, 423.0, 632.0, 684.0, 568.0, 335.0, 198.0, 121.0, 72.0, 53.0, 38.0, 34.0, 25.0, 28.0, 12.0, 12.0, 12.0, 7.0, 7.0, 3.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-85.125, -82.220703125, -79.31640625, -76.412109375, -73.5078125, -70.603515625, -67.69921875, -64.794921875, -61.890625, -58.986328125, -56.08203125, -53.177734375, -50.2734375, -47.369140625, -44.46484375, -41.560546875, -38.65625, -35.751953125, -32.84765625, -29.943359375, -27.0390625, -24.134765625, -21.23046875, -18.326171875, -15.421875, -12.517578125, -9.61328125, -6.708984375, -3.8046875, -0.900390625, 2.00390625, 4.908203125, 7.8125, 10.716796875, 13.62109375, 16.525390625, 19.4296875, 22.333984375, 25.23828125, 28.142578125, 31.046875, 33.951171875, 36.85546875, 39.759765625, 42.6640625, 45.568359375, 48.47265625, 51.376953125, 54.28125, 57.185546875, 60.08984375, 62.994140625, 65.8984375, 68.802734375, 71.70703125, 74.611328125, 77.515625, 80.419921875, 83.32421875, 86.228515625, 89.1328125, 92.037109375, 94.94140625, 97.845703125, 100.75]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 19.0, 21.0, 72.0, 162.0, 287.0, 236.0, 117.0, 51.0, 17.0, 10.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1917.255126953125, -1866.497802734375, -1815.7403564453125, -1764.9830322265625, -1714.2257080078125, -1663.46826171875, -1612.7109375, -1561.95361328125, -1511.1961669921875, -1460.4388427734375, -1409.681396484375, -1358.924072265625, -1308.166748046875, -1257.4093017578125, -1206.6519775390625, -1155.89453125, -1105.13720703125, -1054.3798828125, -1003.6224975585938, -952.8651123046875, -902.1077270507812, -851.350341796875, -800.593017578125, -749.8356323242188, -699.078369140625, -648.3209838867188, -597.5636596679688, -546.8062744140625, -496.04888916015625, -445.2915344238281, -394.5341796875, -343.77679443359375, -293.0194091796875, -242.2620391845703, -191.50466918945312, -140.747314453125, -89.98994445800781, -39.232574462890625, 11.5247802734375, 62.28216552734375, 113.03952026367188, 163.79689025878906, 214.55426025390625, 265.3116149902344, 316.0689697265625, 366.82635498046875, 417.5837097167969, 468.3410949707031, 519.0984497070312, 569.8558349609375, 620.6131591796875, 671.3705444335938, 722.1279296875, 772.88525390625, 823.6426391601562, 874.4000244140625, 925.1573486328125, 975.9147338867188, 1026.672119140625, 1077.429443359375, 1128.186767578125, 1178.9442138671875, 1229.7015380859375, 1280.458984375, 1331.21630859375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 7.0, 10.0, 12.0, 14.0, 16.0, 24.0, 29.0, 31.0, 24.0, 36.0, 42.0, 49.0, 58.0, 46.0, 63.0, 52.0, 41.0, 51.0, 52.0, 39.0, 33.0, 29.0, 30.0, 29.0, 34.0, 18.0, 26.0, 19.0, 23.0, 7.0, 3.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-502.78564453125, -487.50390625, -472.22216796875, -456.9404296875, -441.6586608886719, -426.3769226074219, -411.0951843261719, -395.8134460449219, -380.53167724609375, -365.24993896484375, -349.96820068359375, -334.68646240234375, -319.4046936035156, -304.1229553222656, -288.8412170410156, -273.5594787597656, -258.2777404785156, -242.99600219726562, -227.71424865722656, -212.43251037597656, -197.1507568359375, -181.8690185546875, -166.5872802734375, -151.3055419921875, -136.02378845214844, -120.7420425415039, -105.46029663085938, -90.17855834960938, -74.89681243896484, -59.61506652832031, -44.33332824707031, -29.05158233642578, -13.76983642578125, 1.5119075775146484, 16.793651580810547, 32.07539367675781, 47.357139587402344, 62.638885498046875, 77.92062377929688, 93.2023696899414, 108.48411560058594, 123.76586151123047, 139.047607421875, 154.329345703125, 169.611083984375, 184.89283752441406, 200.17457580566406, 215.45632934570312, 230.73806762695312, 246.01980590820312, 261.3015441894531, 276.58331298828125, 291.86505126953125, 307.14678955078125, 322.42852783203125, 337.71026611328125, 352.99200439453125, 368.27374267578125, 383.55548095703125, 398.83721923828125, 414.1189880371094, 429.4007263183594, 444.6824645996094, 459.9642028808594, 475.2459716796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 1.0, 11.0, 10.0, 21.0, 45.0, 65.0, 110.0, 201.0, 360.0, 700.0, 1504.0, 3167.0, 7517.0, 20044.0, 58044.0, 204418.0, 502920.0, 169535.0, 50151.0, 17278.0, 6808.0, 2922.0, 1303.0, 670.0, 337.0, 162.0, 104.0, 53.0, 24.0, 38.0, 10.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.5, -83.748046875, -80.99609375, -78.244140625, -75.4921875, -72.740234375, -69.98828125, -67.236328125, -64.484375, -61.732421875, -58.98046875, -56.228515625, -53.4765625, -50.724609375, -47.97265625, -45.220703125, -42.46875, -39.716796875, -36.96484375, -34.212890625, -31.4609375, -28.708984375, -25.95703125, -23.205078125, -20.453125, -17.701171875, -14.94921875, -12.197265625, -9.4453125, -6.693359375, -3.94140625, -1.189453125, 1.5625, 4.314453125, 7.06640625, 9.818359375, 12.5703125, 15.322265625, 18.07421875, 20.826171875, 23.578125, 26.330078125, 29.08203125, 31.833984375, 34.5859375, 37.337890625, 40.08984375, 42.841796875, 45.59375, 48.345703125, 51.09765625, 53.849609375, 56.6015625, 59.353515625, 62.10546875, 64.857421875, 67.609375, 70.361328125, 73.11328125, 75.865234375, 78.6171875, 81.369140625, 84.12109375, 86.873046875, 89.625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 12.0, 13.0, 23.0, 28.0, 25.0, 63.0, 64.0, 68.0, 78.0, 84.0, 93.0, 67.0, 76.0, 80.0, 61.0, 33.0, 34.0, 39.0, 19.0, 19.0, 8.0, 7.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.875, -50.72265625, -48.5703125, -46.41796875, -44.265625, -42.11328125, -39.9609375, -37.80859375, -35.65625, -33.50390625, -31.3515625, -29.19921875, -27.046875, -24.89453125, -22.7421875, -20.58984375, -18.4375, -16.28515625, -14.1328125, -11.98046875, -9.828125, -7.67578125, -5.5234375, -3.37109375, -1.21875, 0.93359375, 3.0859375, 5.23828125, 7.390625, 9.54296875, 11.6953125, 13.84765625, 16.0, 18.15234375, 20.3046875, 22.45703125, 24.609375, 26.76171875, 28.9140625, 31.06640625, 33.21875, 35.37109375, 37.5234375, 39.67578125, 41.828125, 43.98046875, 46.1328125, 48.28515625, 50.4375, 52.58984375, 54.7421875, 56.89453125, 59.046875, 61.19921875, 63.3515625, 65.50390625, 67.65625, 69.80859375, 71.9609375, 74.11328125, 76.265625, 78.41796875, 80.5703125, 82.72265625, 84.875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 11.0, 17.0, 22.0, 52.0, 53.0, 83.0, 165.0, 271.0, 515.0, 915.0, 2230.0, 7789.0, 47481.0, 743147.0, 217415.0, 20791.0, 4375.0, 1484.0, 744.0, 380.0, 225.0, 114.0, 79.0, 66.0, 30.0, 24.0, 19.0, 10.0, 7.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.875, -150.548828125, -144.22265625, -137.896484375, -131.5703125, -125.244140625, -118.91796875, -112.591796875, -106.265625, -99.939453125, -93.61328125, -87.287109375, -80.9609375, -74.634765625, -68.30859375, -61.982421875, -55.65625, -49.330078125, -43.00390625, -36.677734375, -30.3515625, -24.025390625, -17.69921875, -11.373046875, -5.046875, 1.279296875, 7.60546875, 13.931640625, 20.2578125, 26.583984375, 32.91015625, 39.236328125, 45.5625, 51.888671875, 58.21484375, 64.541015625, 70.8671875, 77.193359375, 83.51953125, 89.845703125, 96.171875, 102.498046875, 108.82421875, 115.150390625, 121.4765625, 127.802734375, 134.12890625, 140.455078125, 146.78125, 153.107421875, 159.43359375, 165.759765625, 172.0859375, 178.412109375, 184.73828125, 191.064453125, 197.390625, 203.716796875, 210.04296875, 216.369140625, 222.6953125, 229.021484375, 235.34765625, 241.673828125, 248.0]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 15.0, 22.0, 35.0, 50.0, 64.0, 68.0, 99.0, 93.0, 101.0, 95.0, 86.0, 66.0, 53.0, 46.0, 22.0, 23.0, 19.0, 14.0, 7.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.75, -260.83984375, -250.9296875, -241.01953125, -231.109375, -221.19921875, -211.2890625, -201.37890625, -191.46875, -181.55859375, -171.6484375, -161.73828125, -151.828125, -141.91796875, -132.0078125, -122.09765625, -112.1875, -102.27734375, -92.3671875, -82.45703125, -72.546875, -62.63671875, -52.7265625, -42.81640625, -32.90625, -22.99609375, -13.0859375, -3.17578125, 6.734375, 16.64453125, 26.5546875, 36.46484375, 46.375, 56.28515625, 66.1953125, 76.10546875, 86.015625, 95.92578125, 105.8359375, 115.74609375, 125.65625, 135.56640625, 145.4765625, 155.38671875, 165.296875, 175.20703125, 185.1171875, 195.02734375, 204.9375, 214.84765625, 224.7578125, 234.66796875, 244.578125, 254.48828125, 264.3984375, 274.30859375, 284.21875, 294.12890625, 304.0390625, 313.94921875, 323.859375, 333.76953125, 343.6796875, 353.58984375, 363.5]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 10.0, 12.0, 17.0, 35.0, 49.0, 67.0, 81.0, 144.0, 263.0, 405.0, 666.0, 1376.0, 2832.0, 6746.0, 18861.0, 71853.0, 575286.0, 293068.0, 51585.0, 14607.0, 5568.0, 2364.0, 1095.0, 582.0, 364.0, 223.0, 115.0, 76.0, 46.0, 45.0, 22.0, 25.0, 20.0, 14.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.5625, -41.1845703125, -39.806640625, -38.4287109375, -37.05078125, -35.6728515625, -34.294921875, -32.9169921875, -31.5390625, -30.1611328125, -28.783203125, -27.4052734375, -26.02734375, -24.6494140625, -23.271484375, -21.8935546875, -20.515625, -19.1376953125, -17.759765625, -16.3818359375, -15.00390625, -13.6259765625, -12.248046875, -10.8701171875, -9.4921875, -8.1142578125, -6.736328125, -5.3583984375, -3.98046875, -2.6025390625, -1.224609375, 0.1533203125, 1.53125, 2.9091796875, 4.287109375, 5.6650390625, 7.04296875, 8.4208984375, 9.798828125, 11.1767578125, 12.5546875, 13.9326171875, 15.310546875, 16.6884765625, 18.06640625, 19.4443359375, 20.822265625, 22.2001953125, 23.578125, 24.9560546875, 26.333984375, 27.7119140625, 29.08984375, 30.4677734375, 31.845703125, 33.2236328125, 34.6015625, 35.9794921875, 37.357421875, 38.7353515625, 40.11328125, 41.4912109375, 42.869140625, 44.2470703125, 45.625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 7.0, 9.0, 11.0, 9.0, 13.0, 22.0, 20.0, 36.0, 55.0, 87.0, 135.0, 127.0, 138.0, 99.0, 66.0, 39.0, 36.0, 20.0, 10.0, 13.0, 6.0, 5.0, 8.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0214691162109375, -0.02088308334350586, -0.02029705047607422, -0.019711017608642578, -0.019124984741210938, -0.018538951873779297, -0.017952919006347656, -0.017366886138916016, -0.016780853271484375, -0.016194820404052734, -0.015608787536621094, -0.015022754669189453, -0.014436721801757812, -0.013850688934326172, -0.013264656066894531, -0.01267862319946289, -0.01209259033203125, -0.01150655746459961, -0.010920524597167969, -0.010334491729736328, -0.009748458862304688, -0.009162425994873047, -0.008576393127441406, -0.007990360260009766, -0.007404327392578125, -0.006818294525146484, -0.006232261657714844, -0.005646228790283203, -0.0050601959228515625, -0.004474163055419922, -0.0038881301879882812, -0.0033020973205566406, -0.002716064453125, -0.0021300315856933594, -0.0015439987182617188, -0.0009579658508300781, -0.0003719329833984375, 0.00021409988403320312, 0.0008001327514648438, 0.0013861656188964844, 0.001972198486328125, 0.0025582313537597656, 0.0031442642211914062, 0.003730297088623047, 0.0043163299560546875, 0.004902362823486328, 0.005488395690917969, 0.006074428558349609, 0.00666046142578125, 0.007246494293212891, 0.007832527160644531, 0.008418560028076172, 0.009004592895507812, 0.009590625762939453, 0.010176658630371094, 0.010762691497802734, 0.011348724365234375, 0.011934757232666016, 0.012520790100097656, 0.013106822967529297, 0.013692855834960938, 0.014278888702392578, 0.014864921569824219, 0.01545095443725586, 0.0160369873046875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 16.0, 12.0, 26.0, 38.0, 49.0, 80.0, 101.0, 147.0, 211.0, 361.0, 651.0, 1292.0, 2624.0, 6720.0, 20560.0, 86577.0, 606980.0, 253168.0, 46984.0, 12940.0, 4531.0, 1974.0, 1009.0, 535.0, 301.0, 176.0, 147.0, 103.0, 65.0, 43.0, 35.0, 32.0, 15.0, 8.0, 14.0, 8.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.71875, -34.43408203125, -33.1494140625, -31.86474609375, -30.580078125, -29.29541015625, -28.0107421875, -26.72607421875, -25.44140625, -24.15673828125, -22.8720703125, -21.58740234375, -20.302734375, -19.01806640625, -17.7333984375, -16.44873046875, -15.1640625, -13.87939453125, -12.5947265625, -11.31005859375, -10.025390625, -8.74072265625, -7.4560546875, -6.17138671875, -4.88671875, -3.60205078125, -2.3173828125, -1.03271484375, 0.251953125, 1.53662109375, 2.8212890625, 4.10595703125, 5.390625, 6.67529296875, 7.9599609375, 9.24462890625, 10.529296875, 11.81396484375, 13.0986328125, 14.38330078125, 15.66796875, 16.95263671875, 18.2373046875, 19.52197265625, 20.806640625, 22.09130859375, 23.3759765625, 24.66064453125, 25.9453125, 27.22998046875, 28.5146484375, 29.79931640625, 31.083984375, 32.36865234375, 33.6533203125, 34.93798828125, 36.22265625, 37.50732421875, 38.7919921875, 40.07666015625, 41.361328125, 42.64599609375, 43.9306640625, 45.21533203125, 46.5]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 5.0, 12.0, 15.0, 15.0, 25.0, 31.0, 33.0, 29.0, 35.0, 42.0, 55.0, 54.0, 59.0, 65.0, 77.0, 60.0, 62.0, 40.0, 33.0, 45.0, 29.0, 23.0, 13.0, 20.0, 21.0, 14.0, 12.0, 11.0, 7.0, 5.0, 4.0, 6.0, 7.0, 6.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.40625, -27.4072265625, -26.408203125, -25.4091796875, -24.41015625, -23.4111328125, -22.412109375, -21.4130859375, -20.4140625, -19.4150390625, -18.416015625, -17.4169921875, -16.41796875, -15.4189453125, -14.419921875, -13.4208984375, -12.421875, -11.4228515625, -10.423828125, -9.4248046875, -8.42578125, -7.4267578125, -6.427734375, -5.4287109375, -4.4296875, -3.4306640625, -2.431640625, -1.4326171875, -0.43359375, 0.5654296875, 1.564453125, 2.5634765625, 3.5625, 4.5615234375, 5.560546875, 6.5595703125, 7.55859375, 8.5576171875, 9.556640625, 10.5556640625, 11.5546875, 12.5537109375, 13.552734375, 14.5517578125, 15.55078125, 16.5498046875, 17.548828125, 18.5478515625, 19.546875, 20.5458984375, 21.544921875, 22.5439453125, 23.54296875, 24.5419921875, 25.541015625, 26.5400390625, 27.5390625, 28.5380859375, 29.537109375, 30.5361328125, 31.53515625, 32.5341796875, 33.533203125, 34.5322265625, 35.53125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 8.0, 11.0, 18.0, 39.0, 75.0, 119.0, 186.0, 248.0, 123.0, 64.0, 39.0, 23.0, 19.0, 10.0, 6.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1224.50927734375, -1190.79345703125, -1157.07763671875, -1123.3616943359375, -1089.6458740234375, -1055.9300537109375, -1022.2142333984375, -988.4984130859375, -954.7825317382812, -921.0667114257812, -887.350830078125, -853.635009765625, -819.919189453125, -786.2033081054688, -752.4874877929688, -718.7716064453125, -685.0557861328125, -651.3399658203125, -617.6240844726562, -583.9082641601562, -550.1923828125, -516.4765625, -482.7607421875, -449.0448913574219, -415.32904052734375, -381.6131896972656, -347.8973388671875, -314.1815185546875, -280.4656677246094, -246.74981689453125, -213.0339813232422, -179.31814575195312, -145.60223388671875, -111.88639068603516, -78.17054748535156, -44.45470428466797, -10.738861083984375, 22.97698974609375, 56.69282531738281, 90.40866088867188, 124.12451171875, 157.84036254882812, 191.5561981201172, 225.27203369140625, 258.9878845214844, 292.7037353515625, 326.4195556640625, 360.1354064941406, 393.85125732421875, 427.5671081542969, 461.282958984375, 494.998779296875, 528.714599609375, 562.4304809570312, 596.1463012695312, 629.8621826171875, 663.5780029296875, 697.2938232421875, 731.0097045898438, 764.7255249023438, 798.44140625, 832.1572265625, 865.873046875, 899.5888671875, 933.3047485351562]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 8.0, 8.0, 22.0, 16.0, 15.0, 13.0, 19.0, 22.0, 17.0, 29.0, 27.0, 38.0, 37.0, 36.0, 42.0, 69.0, 82.0, 74.0, 56.0, 50.0, 52.0, 32.0, 26.0, 35.0, 33.0, 22.0, 20.0, 18.0, 11.0, 19.0, 6.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-621.338134765625, -599.2092895507812, -577.0805053710938, -554.95166015625, -532.8228149414062, -510.6940002441406, -488.565185546875, -466.43634033203125, -444.3075256347656, -422.1787109375, -400.04986572265625, -377.9210510253906, -355.792236328125, -333.66339111328125, -311.5345764160156, -289.40576171875, -267.27691650390625, -245.14808654785156, -223.01925659179688, -200.89044189453125, -178.76161193847656, -156.63278198242188, -134.50396728515625, -112.37513732910156, -90.24630737304688, -68.11747741699219, -45.98865509033203, -23.859832763671875, -1.7310028076171875, 20.3978271484375, 42.526641845703125, 64.65547180175781, 86.78436279296875, 108.91319274902344, 131.04202270507812, 153.17083740234375, 175.29966735839844, 197.42849731445312, 219.55731201171875, 241.68614196777344, 263.8149719238281, 285.94378662109375, 308.0726318359375, 330.2014465332031, 352.33026123046875, 374.4591064453125, 396.5879211425781, 418.71673583984375, 440.8455810546875, 462.9743957519531, 485.1032409667969, 507.2320556640625, 529.3609008789062, 551.48974609375, 573.6185302734375, 595.7473754882812, 617.876220703125, 640.0050659179688, 662.1338500976562, 684.2626953125, 706.3915405273438, 728.5203857421875, 750.649169921875, 772.7780151367188, 794.9067993164062]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 10.0, 10.0, 10.0, 21.0, 30.0, 35.0, 57.0, 99.0, 146.0, 226.0, 394.0, 706.0, 1249.0, 2478.0, 5664.0, 15421.0, 67333.0, 658834.0, 2894341.0, 470632.0, 53549.0, 13219.0, 4880.0, 2151.0, 1158.0, 591.0, 387.0, 193.0, 152.0, 95.0, 67.0, 40.0, 31.0, 21.0, 12.0, 8.0, 10.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.4375, -63.287109375, -61.13671875, -58.986328125, -56.8359375, -54.685546875, -52.53515625, -50.384765625, -48.234375, -46.083984375, -43.93359375, -41.783203125, -39.6328125, -37.482421875, -35.33203125, -33.181640625, -31.03125, -28.880859375, -26.73046875, -24.580078125, -22.4296875, -20.279296875, -18.12890625, -15.978515625, -13.828125, -11.677734375, -9.52734375, -7.376953125, -5.2265625, -3.076171875, -0.92578125, 1.224609375, 3.375, 5.525390625, 7.67578125, 9.826171875, 11.9765625, 14.126953125, 16.27734375, 18.427734375, 20.578125, 22.728515625, 24.87890625, 27.029296875, 29.1796875, 31.330078125, 33.48046875, 35.630859375, 37.78125, 39.931640625, 42.08203125, 44.232421875, 46.3828125, 48.533203125, 50.68359375, 52.833984375, 54.984375, 57.134765625, 59.28515625, 61.435546875, 63.5859375, 65.736328125, 67.88671875, 70.037109375, 72.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 5.0, 14.0, 11.0, 11.0, 16.0, 22.0, 31.0, 45.0, 51.0, 44.0, 49.0, 59.0, 67.0, 60.0, 63.0, 75.0, 58.0, 55.0, 37.0, 45.0, 49.0, 25.0, 25.0, 20.0, 15.0, 11.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.875, -52.3740234375, -50.873046875, -49.3720703125, -47.87109375, -46.3701171875, -44.869140625, -43.3681640625, -41.8671875, -40.3662109375, -38.865234375, -37.3642578125, -35.86328125, -34.3623046875, -32.861328125, -31.3603515625, -29.859375, -28.3583984375, -26.857421875, -25.3564453125, -23.85546875, -22.3544921875, -20.853515625, -19.3525390625, -17.8515625, -16.3505859375, -14.849609375, -13.3486328125, -11.84765625, -10.3466796875, -8.845703125, -7.3447265625, -5.84375, -4.3427734375, -2.841796875, -1.3408203125, 0.16015625, 1.6611328125, 3.162109375, 4.6630859375, 6.1640625, 7.6650390625, 9.166015625, 10.6669921875, 12.16796875, 13.6689453125, 15.169921875, 16.6708984375, 18.171875, 19.6728515625, 21.173828125, 22.6748046875, 24.17578125, 25.6767578125, 27.177734375, 28.6787109375, 30.1796875, 31.6806640625, 33.181640625, 34.6826171875, 36.18359375, 37.6845703125, 39.185546875, 40.6865234375, 42.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 10.0, 16.0, 25.0, 32.0, 47.0, 73.0, 106.0, 153.0, 236.0, 440.0, 1419.0, 21920.0, 4090630.0, 75264.0, 2581.0, 611.0, 238.0, 156.0, 120.0, 63.0, 51.0, 41.0, 20.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-364.75, -353.57421875, -342.3984375, -331.22265625, -320.046875, -308.87109375, -297.6953125, -286.51953125, -275.34375, -264.16796875, -252.9921875, -241.81640625, -230.640625, -219.46484375, -208.2890625, -197.11328125, -185.9375, -174.76171875, -163.5859375, -152.41015625, -141.234375, -130.05859375, -118.8828125, -107.70703125, -96.53125, -85.35546875, -74.1796875, -63.00390625, -51.828125, -40.65234375, -29.4765625, -18.30078125, -7.125, 4.05078125, 15.2265625, 26.40234375, 37.578125, 48.75390625, 59.9296875, 71.10546875, 82.28125, 93.45703125, 104.6328125, 115.80859375, 126.984375, 138.16015625, 149.3359375, 160.51171875, 171.6875, 182.86328125, 194.0390625, 205.21484375, 216.390625, 227.56640625, 238.7421875, 249.91796875, 261.09375, 272.26953125, 283.4453125, 294.62109375, 305.796875, 316.97265625, 328.1484375, 339.32421875, 350.5]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 11.0, 11.0, 28.0, 48.0, 118.0, 335.0, 1260.0, 1639.0, 409.0, 128.0, 43.0, 24.0, 16.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-291.0, -282.71484375, -274.4296875, -266.14453125, -257.859375, -249.57421875, -241.2890625, -233.00390625, -224.71875, -216.43359375, -208.1484375, -199.86328125, -191.578125, -183.29296875, -175.0078125, -166.72265625, -158.4375, -150.15234375, -141.8671875, -133.58203125, -125.296875, -117.01171875, -108.7265625, -100.44140625, -92.15625, -83.87109375, -75.5859375, -67.30078125, -59.015625, -50.73046875, -42.4453125, -34.16015625, -25.875, -17.58984375, -9.3046875, -1.01953125, 7.265625, 15.55078125, 23.8359375, 32.12109375, 40.40625, 48.69140625, 56.9765625, 65.26171875, 73.546875, 81.83203125, 90.1171875, 98.40234375, 106.6875, 114.97265625, 123.2578125, 131.54296875, 139.828125, 148.11328125, 156.3984375, 164.68359375, 172.96875, 181.25390625, 189.5390625, 197.82421875, 206.109375, 214.39453125, 222.6796875, 230.96484375, 239.25]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 14.0, 30.0, 58.0, 85.0, 193.0, 276.0, 188.0, 72.0, 34.0, 17.0, 13.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1509.131591796875, -1458.294921875, -1407.4583740234375, -1356.6217041015625, -1305.78515625, -1254.948486328125, -1204.11181640625, -1153.2752685546875, -1102.4385986328125, -1051.6019287109375, -1000.765380859375, -949.9287109375, -899.0921020507812, -848.2554931640625, -797.4188842773438, -746.582275390625, -695.7456665039062, -644.9090576171875, -594.0724487304688, -543.23583984375, -492.399169921875, -441.56256103515625, -390.7259521484375, -339.8893127441406, -289.0527038574219, -238.21607971191406, -187.37945556640625, -136.5428466796875, -85.70622253417969, -34.869598388671875, 15.967010498046875, 66.80364990234375, 117.6402587890625, 168.4768829345703, 219.31350708007812, 270.1501159667969, 320.98675537109375, 371.8233642578125, 422.65997314453125, 473.4966125488281, 524.333251953125, 575.1698608398438, 626.0064697265625, 676.8431396484375, 727.6797485351562, 778.516357421875, 829.3529663085938, 880.1895751953125, 931.0261840820312, 981.86279296875, 1032.699462890625, 1083.5360107421875, 1134.3726806640625, 1185.209228515625, 1236.0458984375, 1286.882568359375, 1337.7191162109375, 1388.5557861328125, 1439.392333984375, 1490.22900390625, 1541.0655517578125, 1591.9022216796875, 1642.73876953125, 1693.575439453125, 1744.412109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 4.0, 5.0, 11.0, 9.0, 8.0, 20.0, 27.0, 27.0, 25.0, 36.0, 45.0, 41.0, 49.0, 52.0, 56.0, 55.0, 53.0, 60.0, 56.0, 60.0, 54.0, 44.0, 35.0, 36.0, 33.0, 22.0, 21.0, 16.0, 16.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.2180786132812, -570.8192138671875, -552.4203491210938, -534.0214233398438, -515.62255859375, -497.22369384765625, -478.8248291015625, -460.42596435546875, -442.0270690917969, -423.6282043457031, -405.22930908203125, -386.8304443359375, -368.43157958984375, -350.0326843261719, -331.6338195800781, -313.23492431640625, -294.8360595703125, -276.43719482421875, -258.0382995605469, -239.63943481445312, -221.2405548095703, -202.8416748046875, -184.44281005859375, -166.04393005371094, -147.64505004882812, -129.2461700439453, -110.84729766845703, -92.44842529296875, -74.04954528808594, -55.650665283203125, -37.251792907714844, -18.852920532226562, -0.4541015625, 17.944774627685547, 36.343650817871094, 54.74252700805664, 73.14140319824219, 91.540283203125, 109.93915557861328, 128.33802795410156, 146.73690795898438, 165.1357879638672, 183.53466796875, 201.93353271484375, 220.33241271972656, 238.73129272460938, 257.1301574707031, 275.529052734375, 293.92791748046875, 312.3267822265625, 330.7256774902344, 349.1245422363281, 367.5234375, 385.92230224609375, 404.3211669921875, 422.72003173828125, 441.1189270019531, 459.5177917480469, 477.91668701171875, 496.3155517578125, 514.7144165039062, 533.11328125, 551.51220703125, 569.9110717773438, 588.3099365234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 11.0, 14.0, 28.0, 35.0, 65.0, 75.0, 104.0, 173.0, 264.0, 381.0, 675.0, 1009.0, 1639.0, 2715.0, 4614.0, 8333.0, 15642.0, 30873.0, 64199.0, 143086.0, 292468.0, 254336.0, 117494.0, 53493.0, 25908.0, 13289.0, 7105.0, 4119.0, 2413.0, 1435.0, 900.0, 555.0, 354.0, 256.0, 177.0, 119.0, 55.0, 44.0, 26.0, 20.0, 13.0, 9.0, 11.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-44.46875, -43.1162109375, -41.763671875, -40.4111328125, -39.05859375, -37.7060546875, -36.353515625, -35.0009765625, -33.6484375, -32.2958984375, -30.943359375, -29.5908203125, -28.23828125, -26.8857421875, -25.533203125, -24.1806640625, -22.828125, -21.4755859375, -20.123046875, -18.7705078125, -17.41796875, -16.0654296875, -14.712890625, -13.3603515625, -12.0078125, -10.6552734375, -9.302734375, -7.9501953125, -6.59765625, -5.2451171875, -3.892578125, -2.5400390625, -1.1875, 0.1650390625, 1.517578125, 2.8701171875, 4.22265625, 5.5751953125, 6.927734375, 8.2802734375, 9.6328125, 10.9853515625, 12.337890625, 13.6904296875, 15.04296875, 16.3955078125, 17.748046875, 19.1005859375, 20.453125, 21.8056640625, 23.158203125, 24.5107421875, 25.86328125, 27.2158203125, 28.568359375, 29.9208984375, 31.2734375, 32.6259765625, 33.978515625, 35.3310546875, 36.68359375, 38.0361328125, 39.388671875, 40.7412109375, 42.09375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 5.0, 6.0, 8.0, 8.0, 12.0, 10.0, 13.0, 19.0, 23.0, 37.0, 35.0, 50.0, 48.0, 57.0, 55.0, 51.0, 62.0, 53.0, 59.0, 56.0, 61.0, 50.0, 36.0, 36.0, 30.0, 26.0, 22.0, 26.0, 6.0, 18.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.15625, -53.5771484375, -51.998046875, -50.4189453125, -48.83984375, -47.2607421875, -45.681640625, -44.1025390625, -42.5234375, -40.9443359375, -39.365234375, -37.7861328125, -36.20703125, -34.6279296875, -33.048828125, -31.4697265625, -29.890625, -28.3115234375, -26.732421875, -25.1533203125, -23.57421875, -21.9951171875, -20.416015625, -18.8369140625, -17.2578125, -15.6787109375, -14.099609375, -12.5205078125, -10.94140625, -9.3623046875, -7.783203125, -6.2041015625, -4.625, -3.0458984375, -1.466796875, 0.1123046875, 1.69140625, 3.2705078125, 4.849609375, 6.4287109375, 8.0078125, 9.5869140625, 11.166015625, 12.7451171875, 14.32421875, 15.9033203125, 17.482421875, 19.0615234375, 20.640625, 22.2197265625, 23.798828125, 25.3779296875, 26.95703125, 28.5361328125, 30.115234375, 31.6943359375, 33.2734375, 34.8525390625, 36.431640625, 38.0107421875, 39.58984375, 41.1689453125, 42.748046875, 44.3271484375, 45.90625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 8.0, 5.0, 19.0, 22.0, 21.0, 46.0, 83.0, 199.0, 442.0, 1152.0, 3208.0, 11024.0, 54963.0, 610550.0, 314279.0, 39696.0, 8518.0, 2588.0, 927.0, 388.0, 181.0, 85.0, 46.0, 35.0, 25.0, 12.0, 3.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.0, -116.814453125, -112.62890625, -108.443359375, -104.2578125, -100.072265625, -95.88671875, -91.701171875, -87.515625, -83.330078125, -79.14453125, -74.958984375, -70.7734375, -66.587890625, -62.40234375, -58.216796875, -54.03125, -49.845703125, -45.66015625, -41.474609375, -37.2890625, -33.103515625, -28.91796875, -24.732421875, -20.546875, -16.361328125, -12.17578125, -7.990234375, -3.8046875, 0.380859375, 4.56640625, 8.751953125, 12.9375, 17.123046875, 21.30859375, 25.494140625, 29.6796875, 33.865234375, 38.05078125, 42.236328125, 46.421875, 50.607421875, 54.79296875, 58.978515625, 63.1640625, 67.349609375, 71.53515625, 75.720703125, 79.90625, 84.091796875, 88.27734375, 92.462890625, 96.6484375, 100.833984375, 105.01953125, 109.205078125, 113.390625, 117.576171875, 121.76171875, 125.947265625, 130.1328125, 134.318359375, 138.50390625, 142.689453125, 146.875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 7.0, 9.0, 8.0, 13.0, 28.0, 28.0, 38.0, 32.0, 46.0, 45.0, 51.0, 64.0, 58.0, 52.0, 62.0, 78.0, 46.0, 48.0, 44.0, 43.0, 28.0, 32.0, 36.0, 13.0, 22.0, 6.0, 12.0, 5.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-200.125, -194.01171875, -187.8984375, -181.78515625, -175.671875, -169.55859375, -163.4453125, -157.33203125, -151.21875, -145.10546875, -138.9921875, -132.87890625, -126.765625, -120.65234375, -114.5390625, -108.42578125, -102.3125, -96.19921875, -90.0859375, -83.97265625, -77.859375, -71.74609375, -65.6328125, -59.51953125, -53.40625, -47.29296875, -41.1796875, -35.06640625, -28.953125, -22.83984375, -16.7265625, -10.61328125, -4.5, 1.61328125, 7.7265625, 13.83984375, 19.953125, 26.06640625, 32.1796875, 38.29296875, 44.40625, 50.51953125, 56.6328125, 62.74609375, 68.859375, 74.97265625, 81.0859375, 87.19921875, 93.3125, 99.42578125, 105.5390625, 111.65234375, 117.765625, 123.87890625, 129.9921875, 136.10546875, 142.21875, 148.33203125, 154.4453125, 160.55859375, 166.671875, 172.78515625, 178.8984375, 185.01171875, 191.125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 12.0, 21.0, 21.0, 41.0, 54.0, 109.0, 205.0, 425.0, 997.0, 2590.0, 8855.0, 35096.0, 166522.0, 641214.0, 148259.0, 31623.0, 8108.0, 2548.0, 961.0, 383.0, 212.0, 103.0, 58.0, 37.0, 24.0, 17.0, 15.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.1875, -30.226806640625, -29.26611328125, -28.305419921875, -27.3447265625, -26.384033203125, -25.42333984375, -24.462646484375, -23.501953125, -22.541259765625, -21.58056640625, -20.619873046875, -19.6591796875, -18.698486328125, -17.73779296875, -16.777099609375, -15.81640625, -14.855712890625, -13.89501953125, -12.934326171875, -11.9736328125, -11.012939453125, -10.05224609375, -9.091552734375, -8.130859375, -7.170166015625, -6.20947265625, -5.248779296875, -4.2880859375, -3.327392578125, -2.36669921875, -1.406005859375, -0.4453125, 0.515380859375, 1.47607421875, 2.436767578125, 3.3974609375, 4.358154296875, 5.31884765625, 6.279541015625, 7.240234375, 8.200927734375, 9.16162109375, 10.122314453125, 11.0830078125, 12.043701171875, 13.00439453125, 13.965087890625, 14.92578125, 15.886474609375, 16.84716796875, 17.807861328125, 18.7685546875, 19.729248046875, 20.68994140625, 21.650634765625, 22.611328125, 23.572021484375, 24.53271484375, 25.493408203125, 26.4541015625, 27.414794921875, 28.37548828125, 29.336181640625, 30.296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 6.0, 12.0, 10.0, 13.0, 13.0, 19.0, 25.0, 33.0, 36.0, 53.0, 61.0, 74.0, 72.0, 81.0, 94.0, 71.0, 76.0, 44.0, 54.0, 28.0, 27.0, 26.0, 15.0, 9.0, 9.0, 8.0, 7.0, 5.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01110076904296875, -0.010815560817718506, -0.010530352592468262, -0.010245144367218018, -0.009959936141967773, -0.00967472791671753, -0.009389519691467285, -0.009104311466217041, -0.008819103240966797, -0.008533895015716553, -0.008248686790466309, -0.007963478565216064, -0.00767827033996582, -0.007393062114715576, -0.007107853889465332, -0.006822645664215088, -0.006537437438964844, -0.0062522292137146, -0.0059670209884643555, -0.005681812763214111, -0.005396604537963867, -0.005111396312713623, -0.004826188087463379, -0.004540979862213135, -0.004255771636962891, -0.0039705634117126465, -0.0036853551864624023, -0.003400146961212158, -0.003114938735961914, -0.00282973051071167, -0.0025445222854614258, -0.0022593140602111816, -0.0019741058349609375, -0.0016888976097106934, -0.0014036893844604492, -0.001118481159210205, -0.0008332729339599609, -0.0005480647087097168, -0.00026285648345947266, 2.2351741790771484e-05, 0.0003075599670410156, 0.0005927681922912598, 0.0008779764175415039, 0.001163184642791748, 0.0014483928680419922, 0.0017336010932922363, 0.0020188093185424805, 0.0023040175437927246, 0.0025892257690429688, 0.002874433994293213, 0.003159642219543457, 0.003444850444793701, 0.0037300586700439453, 0.0040152668952941895, 0.004300475120544434, 0.004585683345794678, 0.004870891571044922, 0.005156099796295166, 0.00544130802154541, 0.005726516246795654, 0.0060117244720458984, 0.006296932697296143, 0.006582140922546387, 0.006867349147796631, 0.007152557373046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 9.0, 25.0, 38.0, 82.0, 141.0, 243.0, 581.0, 1483.0, 4299.0, 16100.0, 77608.0, 567917.0, 306886.0, 55340.0, 12047.0, 3483.0, 1236.0, 516.0, 239.0, 118.0, 57.0, 32.0, 23.0, 14.0, 6.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.125, -27.0390625, -25.953125, -24.8671875, -23.78125, -22.6953125, -21.609375, -20.5234375, -19.4375, -18.3515625, -17.265625, -16.1796875, -15.09375, -14.0078125, -12.921875, -11.8359375, -10.75, -9.6640625, -8.578125, -7.4921875, -6.40625, -5.3203125, -4.234375, -3.1484375, -2.0625, -0.9765625, 0.109375, 1.1953125, 2.28125, 3.3671875, 4.453125, 5.5390625, 6.625, 7.7109375, 8.796875, 9.8828125, 10.96875, 12.0546875, 13.140625, 14.2265625, 15.3125, 16.3984375, 17.484375, 18.5703125, 19.65625, 20.7421875, 21.828125, 22.9140625, 24.0, 25.0859375, 26.171875, 27.2578125, 28.34375, 29.4296875, 30.515625, 31.6015625, 32.6875, 33.7734375, 34.859375, 35.9453125, 37.03125, 38.1171875, 39.203125, 40.2890625, 41.375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 13.0, 13.0, 18.0, 28.0, 35.0, 42.0, 61.0, 65.0, 80.0, 70.0, 73.0, 96.0, 53.0, 76.0, 48.0, 50.0, 34.0, 39.0, 20.0, 23.0, 13.0, 7.0, 9.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-42.21875, -41.120361328125, -40.02197265625, -38.923583984375, -37.8251953125, -36.726806640625, -35.62841796875, -34.530029296875, -33.431640625, -32.333251953125, -31.23486328125, -30.136474609375, -29.0380859375, -27.939697265625, -26.84130859375, -25.742919921875, -24.64453125, -23.546142578125, -22.44775390625, -21.349365234375, -20.2509765625, -19.152587890625, -18.05419921875, -16.955810546875, -15.857421875, -14.759033203125, -13.66064453125, -12.562255859375, -11.4638671875, -10.365478515625, -9.26708984375, -8.168701171875, -7.0703125, -5.971923828125, -4.87353515625, -3.775146484375, -2.6767578125, -1.578369140625, -0.47998046875, 0.618408203125, 1.716796875, 2.815185546875, 3.91357421875, 5.011962890625, 6.1103515625, 7.208740234375, 8.30712890625, 9.405517578125, 10.50390625, 11.602294921875, 12.70068359375, 13.799072265625, 14.8974609375, 15.995849609375, 17.09423828125, 18.192626953125, 19.291015625, 20.389404296875, 21.48779296875, 22.586181640625, 23.6845703125, 24.782958984375, 25.88134765625, 26.979736328125, 28.078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 25.0, 56.0, 139.0, 359.0, 263.0, 79.0, 40.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1960.0020751953125, -1916.3197021484375, -1872.637451171875, -1828.955078125, -1785.272705078125, -1741.5904541015625, -1697.9080810546875, -1654.225830078125, -1610.54345703125, -1566.861083984375, -1523.1788330078125, -1479.4964599609375, -1435.8140869140625, -1392.1318359375, -1348.449462890625, -1304.76708984375, -1261.084716796875, -1217.40234375, -1173.7200927734375, -1130.0377197265625, -1086.3553466796875, -1042.673095703125, -998.99072265625, -955.3084106445312, -911.6260986328125, -867.9437866210938, -824.2614135742188, -780.5791015625, -736.8967895507812, -693.2144775390625, -649.5321044921875, -605.8497924804688, -562.16748046875, -518.4851684570312, -474.8028259277344, -431.1204833984375, -387.43817138671875, -343.7558288574219, -300.073486328125, -256.39117431640625, -212.70883178710938, -169.02650451660156, -125.34416961669922, -81.66183471679688, -37.97950744628906, 5.70281982421875, 49.385162353515625, 93.06747436523438, 136.74981689453125, 180.43214416503906, 224.11447143554688, 267.79681396484375, 311.4791259765625, 355.1614685058594, 398.84381103515625, 442.526123046875, 486.2084655761719, 529.8908081054688, 573.5731201171875, 617.2554931640625, 660.9378051757812, 704.6201171875, 748.302490234375, 791.9847412109375, 835.6671142578125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 4.0, 9.0, 4.0, 5.0, 13.0, 9.0, 16.0, 17.0, 12.0, 22.0, 24.0, 25.0, 25.0, 30.0, 37.0, 45.0, 50.0, 79.0, 71.0, 82.0, 48.0, 40.0, 38.0, 35.0, 24.0, 34.0, 17.0, 28.0, 22.0, 20.0, 17.0, 13.0, 8.0, 16.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-676.45458984375, -656.978515625, -637.5025024414062, -618.0264282226562, -598.5504150390625, -579.0743408203125, -559.5983276367188, -540.1222534179688, -520.646240234375, -501.1701965332031, -481.69415283203125, -462.2181091308594, -442.7420654296875, -423.2659912109375, -403.7899475097656, -384.31390380859375, -364.83782958984375, -345.3617858886719, -325.8857421875, -306.4096984863281, -286.93365478515625, -267.45758056640625, -247.98153686523438, -228.5054931640625, -209.02944946289062, -189.55340576171875, -170.07736206054688, -150.60130310058594, -131.12525939941406, -111.64921569824219, -92.17316436767578, -72.69711303710938, -53.2210693359375, -33.74502182006836, -14.268974304199219, 5.207073211669922, 24.683120727539062, 44.15916442871094, 63.635215759277344, 83.11126708984375, 102.58731079101562, 122.0633544921875, 141.53939819335938, 161.0154571533203, 180.4915008544922, 199.96754455566406, 219.443603515625, 238.91964721679688, 258.39569091796875, 277.8717346191406, 297.3477783203125, 316.8238220214844, 336.29986572265625, 355.77593994140625, 375.2519836425781, 394.72802734375, 414.2040710449219, 433.68011474609375, 453.1561584472656, 472.6322021484375, 492.1082763671875, 511.58428955078125, 531.0603637695312, 550.536376953125, 570.012451171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 4.0, 8.0, 8.0, 16.0, 17.0, 18.0, 25.0, 35.0, 40.0, 75.0, 140.0, 292.0, 961.0, 3287.0, 16414.0, 305575.0, 3542003.0, 303306.0, 16907.0, 3377.0, 988.0, 350.0, 147.0, 59.0, 47.0, 32.0, 28.0, 21.0, 14.0, 9.0, 18.0, 13.0, 6.0, 3.0, 8.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.5625, -105.1162109375, -101.669921875, -98.2236328125, -94.77734375, -91.3310546875, -87.884765625, -84.4384765625, -80.9921875, -77.5458984375, -74.099609375, -70.6533203125, -67.20703125, -63.7607421875, -60.314453125, -56.8681640625, -53.421875, -49.9755859375, -46.529296875, -43.0830078125, -39.63671875, -36.1904296875, -32.744140625, -29.2978515625, -25.8515625, -22.4052734375, -18.958984375, -15.5126953125, -12.06640625, -8.6201171875, -5.173828125, -1.7275390625, 1.71875, 5.1650390625, 8.611328125, 12.0576171875, 15.50390625, 18.9501953125, 22.396484375, 25.8427734375, 29.2890625, 32.7353515625, 36.181640625, 39.6279296875, 43.07421875, 46.5205078125, 49.966796875, 53.4130859375, 56.859375, 60.3056640625, 63.751953125, 67.1982421875, 70.64453125, 74.0908203125, 77.537109375, 80.9833984375, 84.4296875, 87.8759765625, 91.322265625, 94.7685546875, 98.21484375, 101.6611328125, 105.107421875, 108.5537109375, 112.0]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 0.0, 4.0, 7.0, 6.0, 4.0, 9.0, 10.0, 11.0, 6.0, 16.0, 12.0, 15.0, 19.0, 24.0, 29.0, 39.0, 44.0, 42.0, 46.0, 52.0, 49.0, 33.0, 40.0, 53.0, 51.0, 41.0, 32.0, 47.0, 34.0, 39.0, 32.0, 25.0, 19.0, 24.0, 10.0, 14.0, 16.0, 13.0, 9.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.78125, -39.51806640625, -38.2548828125, -36.99169921875, -35.728515625, -34.46533203125, -33.2021484375, -31.93896484375, -30.67578125, -29.41259765625, -28.1494140625, -26.88623046875, -25.623046875, -24.35986328125, -23.0966796875, -21.83349609375, -20.5703125, -19.30712890625, -18.0439453125, -16.78076171875, -15.517578125, -14.25439453125, -12.9912109375, -11.72802734375, -10.46484375, -9.20166015625, -7.9384765625, -6.67529296875, -5.412109375, -4.14892578125, -2.8857421875, -1.62255859375, -0.359375, 0.90380859375, 2.1669921875, 3.43017578125, 4.693359375, 5.95654296875, 7.2197265625, 8.48291015625, 9.74609375, 11.00927734375, 12.2724609375, 13.53564453125, 14.798828125, 16.06201171875, 17.3251953125, 18.58837890625, 19.8515625, 21.11474609375, 22.3779296875, 23.64111328125, 24.904296875, 26.16748046875, 27.4306640625, 28.69384765625, 29.95703125, 31.22021484375, 32.4833984375, 33.74658203125, 35.009765625, 36.27294921875, 37.5361328125, 38.79931640625, 40.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 12.0, 16.0, 68.0, 110.0, 256.0, 855.0, 13677.0, 4151282.0, 26451.0, 1022.0, 281.0, 128.0, 55.0, 37.0, 19.0, 14.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-430.25, -416.17578125, -402.1015625, -388.02734375, -373.953125, -359.87890625, -345.8046875, -331.73046875, -317.65625, -303.58203125, -289.5078125, -275.43359375, -261.359375, -247.28515625, -233.2109375, -219.13671875, -205.0625, -190.98828125, -176.9140625, -162.83984375, -148.765625, -134.69140625, -120.6171875, -106.54296875, -92.46875, -78.39453125, -64.3203125, -50.24609375, -36.171875, -22.09765625, -8.0234375, 6.05078125, 20.125, 34.19921875, 48.2734375, 62.34765625, 76.421875, 90.49609375, 104.5703125, 118.64453125, 132.71875, 146.79296875, 160.8671875, 174.94140625, 189.015625, 203.08984375, 217.1640625, 231.23828125, 245.3125, 259.38671875, 273.4609375, 287.53515625, 301.609375, 315.68359375, 329.7578125, 343.83203125, 357.90625, 371.98046875, 386.0546875, 400.12890625, 414.203125, 428.27734375, 442.3515625, 456.42578125, 470.5]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 12.0, 29.0, 47.0, 99.0, 396.0, 1714.0, 1348.0, 284.0, 81.0, 35.0, 13.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.25, -254.7265625, -246.203125, -237.6796875, -229.15625, -220.6328125, -212.109375, -203.5859375, -195.0625, -186.5390625, -178.015625, -169.4921875, -160.96875, -152.4453125, -143.921875, -135.3984375, -126.875, -118.3515625, -109.828125, -101.3046875, -92.78125, -84.2578125, -75.734375, -67.2109375, -58.6875, -50.1640625, -41.640625, -33.1171875, -24.59375, -16.0703125, -7.546875, 0.9765625, 9.5, 18.0234375, 26.546875, 35.0703125, 43.59375, 52.1171875, 60.640625, 69.1640625, 77.6875, 86.2109375, 94.734375, 103.2578125, 111.78125, 120.3046875, 128.828125, 137.3515625, 145.875, 154.3984375, 162.921875, 171.4453125, 179.96875, 188.4921875, 197.015625, 205.5390625, 214.0625, 222.5859375, 231.109375, 239.6328125, 248.15625, 256.6796875, 265.203125, 273.7265625, 282.25]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 17.0, 19.0, 15.0, 41.0, 43.0, 80.0, 132.0, 179.0, 143.0, 113.0, 99.0, 37.0, 29.0, 14.0, 12.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-973.7903442382812, -947.4930419921875, -921.1957397460938, -894.8983764648438, -868.60107421875, -842.3037719726562, -816.0064697265625, -789.7091064453125, -763.4118041992188, -737.114501953125, -710.8171997070312, -684.5198364257812, -658.2225341796875, -631.9252319335938, -605.6279296875, -579.33056640625, -553.0333251953125, -526.7360229492188, -500.4386901855469, -474.1413879394531, -447.84405517578125, -421.5467529296875, -395.24945068359375, -368.9521179199219, -342.65478515625, -316.35748291015625, -290.0601501464844, -263.7628479003906, -237.46551513671875, -211.168212890625, -184.8708953857422, -158.57357788085938, -132.2762451171875, -105.97892761230469, -79.68161010742188, -53.384300231933594, -27.08698272705078, -0.7896728515625, 25.507644653320312, 51.804962158203125, 78.10227966308594, 104.39959716796875, 130.69691467285156, 156.99423217773438, 183.29153442382812, 209.58885192871094, 235.88616943359375, 262.1834716796875, 288.4808044433594, 314.7781066894531, 341.075439453125, 367.37274169921875, 393.6700744628906, 419.9673767089844, 446.26470947265625, 472.56201171875, 498.85931396484375, 525.1566162109375, 551.4539184570312, 577.7512817382812, 604.048583984375, 630.3458862304688, 656.6431884765625, 682.9405517578125, 709.2378540039062]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 1.0, 6.0, 3.0, 6.0, 8.0, 4.0, 9.0, 9.0, 14.0, 17.0, 11.0, 27.0, 30.0, 29.0, 26.0, 33.0, 33.0, 28.0, 34.0, 32.0, 49.0, 47.0, 42.0, 41.0, 44.0, 31.0, 42.0, 32.0, 35.0, 34.0, 16.0, 29.0, 24.0, 17.0, 17.0, 20.0, 17.0, 22.0, 9.0, 16.0, 9.0, 3.0, 12.0, 7.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-434.8672180175781, -421.15618896484375, -407.44512939453125, -393.73406982421875, -380.0230407714844, -366.31201171875, -352.6009521484375, -338.889892578125, -325.1788635253906, -311.46783447265625, -297.75677490234375, -284.04571533203125, -270.3346862792969, -256.6236572265625, -242.91259765625, -229.20155334472656, -215.49050903320312, -201.7794647216797, -188.06842041015625, -174.3573760986328, -160.64633178710938, -146.93528747558594, -133.2242431640625, -119.51319885253906, -105.80215454101562, -92.09111022949219, -78.38006591796875, -64.66902160644531, -50.957977294921875, -37.24693298339844, -23.535888671875, -9.824844360351562, 3.88623046875, 17.597274780273438, 31.308319091796875, 45.01936340332031, 58.73040771484375, 72.44145202636719, 86.15249633789062, 99.86354064941406, 113.5745849609375, 127.28562927246094, 140.99667358398438, 154.7077178955078, 168.41876220703125, 182.1298065185547, 195.84085083007812, 209.55189514160156, 223.262939453125, 236.97398376464844, 250.68502807617188, 264.39605712890625, 278.10711669921875, 291.81817626953125, 305.5292053222656, 319.240234375, 332.9512939453125, 346.662353515625, 360.3733825683594, 374.08441162109375, 387.79547119140625, 401.50653076171875, 415.2175598144531, 428.9285888671875, 442.6396484375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 12.0, 18.0, 39.0, 44.0, 75.0, 81.0, 129.0, 229.0, 304.0, 489.0, 780.0, 1186.0, 2012.0, 3341.0, 5522.0, 9790.0, 17678.0, 32318.0, 63723.0, 126578.0, 251100.0, 258932.0, 132386.0, 65143.0, 33902.0, 18071.0, 10081.0, 5697.0, 3385.0, 1981.0, 1295.0, 723.0, 512.0, 324.0, 213.0, 149.0, 78.0, 67.0, 49.0, 29.0, 23.0, 17.0, 15.0, 13.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-40.71875, -39.48583984375, -38.2529296875, -37.02001953125, -35.787109375, -34.55419921875, -33.3212890625, -32.08837890625, -30.85546875, -29.62255859375, -28.3896484375, -27.15673828125, -25.923828125, -24.69091796875, -23.4580078125, -22.22509765625, -20.9921875, -19.75927734375, -18.5263671875, -17.29345703125, -16.060546875, -14.82763671875, -13.5947265625, -12.36181640625, -11.12890625, -9.89599609375, -8.6630859375, -7.43017578125, -6.197265625, -4.96435546875, -3.7314453125, -2.49853515625, -1.265625, -0.03271484375, 1.2001953125, 2.43310546875, 3.666015625, 4.89892578125, 6.1318359375, 7.36474609375, 8.59765625, 9.83056640625, 11.0634765625, 12.29638671875, 13.529296875, 14.76220703125, 15.9951171875, 17.22802734375, 18.4609375, 19.69384765625, 20.9267578125, 22.15966796875, 23.392578125, 24.62548828125, 25.8583984375, 27.09130859375, 28.32421875, 29.55712890625, 30.7900390625, 32.02294921875, 33.255859375, 34.48876953125, 35.7216796875, 36.95458984375, 38.1875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 1.0, 3.0, 8.0, 3.0, 9.0, 10.0, 13.0, 9.0, 18.0, 19.0, 24.0, 33.0, 46.0, 39.0, 43.0, 43.0, 59.0, 70.0, 60.0, 34.0, 46.0, 47.0, 48.0, 44.0, 42.0, 44.0, 23.0, 35.0, 22.0, 20.0, 23.0, 15.0, 12.0, 11.0, 5.0, 4.0, 7.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.34375, -51.77734375, -50.2109375, -48.64453125, -47.078125, -45.51171875, -43.9453125, -42.37890625, -40.8125, -39.24609375, -37.6796875, -36.11328125, -34.546875, -32.98046875, -31.4140625, -29.84765625, -28.28125, -26.71484375, -25.1484375, -23.58203125, -22.015625, -20.44921875, -18.8828125, -17.31640625, -15.75, -14.18359375, -12.6171875, -11.05078125, -9.484375, -7.91796875, -6.3515625, -4.78515625, -3.21875, -1.65234375, -0.0859375, 1.48046875, 3.046875, 4.61328125, 6.1796875, 7.74609375, 9.3125, 10.87890625, 12.4453125, 14.01171875, 15.578125, 17.14453125, 18.7109375, 20.27734375, 21.84375, 23.41015625, 24.9765625, 26.54296875, 28.109375, 29.67578125, 31.2421875, 32.80859375, 34.375, 35.94140625, 37.5078125, 39.07421875, 40.640625, 42.20703125, 43.7734375, 45.33984375, 46.90625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 9.0, 5.0, 12.0, 6.0, 13.0, 23.0, 39.0, 36.0, 80.0, 89.0, 161.0, 250.0, 583.0, 1471.0, 5413.0, 27802.0, 334125.0, 635496.0, 33660.0, 6214.0, 1670.0, 606.0, 305.0, 148.0, 92.0, 62.0, 53.0, 34.0, 31.0, 13.0, 13.0, 12.0, 5.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-135.375, -129.970703125, -124.56640625, -119.162109375, -113.7578125, -108.353515625, -102.94921875, -97.544921875, -92.140625, -86.736328125, -81.33203125, -75.927734375, -70.5234375, -65.119140625, -59.71484375, -54.310546875, -48.90625, -43.501953125, -38.09765625, -32.693359375, -27.2890625, -21.884765625, -16.48046875, -11.076171875, -5.671875, -0.267578125, 5.13671875, 10.541015625, 15.9453125, 21.349609375, 26.75390625, 32.158203125, 37.5625, 42.966796875, 48.37109375, 53.775390625, 59.1796875, 64.583984375, 69.98828125, 75.392578125, 80.796875, 86.201171875, 91.60546875, 97.009765625, 102.4140625, 107.818359375, 113.22265625, 118.626953125, 124.03125, 129.435546875, 134.83984375, 140.244140625, 145.6484375, 151.052734375, 156.45703125, 161.861328125, 167.265625, 172.669921875, 178.07421875, 183.478515625, 188.8828125, 194.287109375, 199.69140625, 205.095703125, 210.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 15.0, 13.0, 13.0, 13.0, 24.0, 26.0, 24.0, 50.0, 50.0, 66.0, 67.0, 88.0, 77.0, 89.0, 91.0, 62.0, 44.0, 45.0, 28.0, 28.0, 21.0, 10.0, 9.0, 13.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-201.625, -192.599609375, -183.57421875, -174.548828125, -165.5234375, -156.498046875, -147.47265625, -138.447265625, -129.421875, -120.396484375, -111.37109375, -102.345703125, -93.3203125, -84.294921875, -75.26953125, -66.244140625, -57.21875, -48.193359375, -39.16796875, -30.142578125, -21.1171875, -12.091796875, -3.06640625, 5.958984375, 14.984375, 24.009765625, 33.03515625, 42.060546875, 51.0859375, 60.111328125, 69.13671875, 78.162109375, 87.1875, 96.212890625, 105.23828125, 114.263671875, 123.2890625, 132.314453125, 141.33984375, 150.365234375, 159.390625, 168.416015625, 177.44140625, 186.466796875, 195.4921875, 204.517578125, 213.54296875, 222.568359375, 231.59375, 240.619140625, 249.64453125, 258.669921875, 267.6953125, 276.720703125, 285.74609375, 294.771484375, 303.796875, 312.822265625, 321.84765625, 330.873046875, 339.8984375, 348.923828125, 357.94921875, 366.974609375, 376.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 11.0, 13.0, 14.0, 20.0, 32.0, 39.0, 62.0, 121.0, 214.0, 341.0, 627.0, 1413.0, 3518.0, 10588.0, 41838.0, 304161.0, 612761.0, 52904.0, 12517.0, 4137.0, 1586.0, 690.0, 382.0, 196.0, 108.0, 74.0, 58.0, 29.0, 15.0, 23.0, 13.0, 14.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.8125, -31.6435546875, -30.474609375, -29.3056640625, -28.13671875, -26.9677734375, -25.798828125, -24.6298828125, -23.4609375, -22.2919921875, -21.123046875, -19.9541015625, -18.78515625, -17.6162109375, -16.447265625, -15.2783203125, -14.109375, -12.9404296875, -11.771484375, -10.6025390625, -9.43359375, -8.2646484375, -7.095703125, -5.9267578125, -4.7578125, -3.5888671875, -2.419921875, -1.2509765625, -0.08203125, 1.0869140625, 2.255859375, 3.4248046875, 4.59375, 5.7626953125, 6.931640625, 8.1005859375, 9.26953125, 10.4384765625, 11.607421875, 12.7763671875, 13.9453125, 15.1142578125, 16.283203125, 17.4521484375, 18.62109375, 19.7900390625, 20.958984375, 22.1279296875, 23.296875, 24.4658203125, 25.634765625, 26.8037109375, 27.97265625, 29.1416015625, 30.310546875, 31.4794921875, 32.6484375, 33.8173828125, 34.986328125, 36.1552734375, 37.32421875, 38.4931640625, 39.662109375, 40.8310546875, 42.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 15.0, 24.0, 26.0, 15.0, 44.0, 47.0, 74.0, 105.0, 135.0, 132.0, 97.0, 71.0, 60.0, 32.0, 19.0, 27.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0117950439453125, -0.01139974594116211, -0.011004447937011719, -0.010609149932861328, -0.010213851928710938, -0.009818553924560547, -0.009423255920410156, -0.009027957916259766, -0.008632659912109375, -0.008237361907958984, -0.007842063903808594, -0.007446765899658203, -0.0070514678955078125, -0.006656169891357422, -0.006260871887207031, -0.005865573883056641, -0.00547027587890625, -0.005074977874755859, -0.004679679870605469, -0.004284381866455078, -0.0038890838623046875, -0.003493785858154297, -0.0030984878540039062, -0.0027031898498535156, -0.002307891845703125, -0.0019125938415527344, -0.0015172958374023438, -0.0011219978332519531, -0.0007266998291015625, -0.0003314018249511719, 6.389617919921875e-05, 0.0004591941833496094, 0.0008544921875, 0.0012497901916503906, 0.0016450881958007812, 0.002040386199951172, 0.0024356842041015625, 0.002830982208251953, 0.0032262802124023438, 0.0036215782165527344, 0.004016876220703125, 0.004412174224853516, 0.004807472229003906, 0.005202770233154297, 0.0055980682373046875, 0.005993366241455078, 0.006388664245605469, 0.006783962249755859, 0.00717926025390625, 0.007574558258056641, 0.007969856262207031, 0.008365154266357422, 0.008760452270507812, 0.009155750274658203, 0.009551048278808594, 0.009946346282958984, 0.010341644287109375, 0.010736942291259766, 0.011132240295410156, 0.011527538299560547, 0.011922836303710938, 0.012318134307861328, 0.012713432312011719, 0.01310873031616211, 0.0135040283203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 1.0, 2.0, 12.0, 6.0, 15.0, 26.0, 28.0, 28.0, 63.0, 93.0, 166.0, 300.0, 635.0, 1521.0, 4640.0, 18892.0, 126188.0, 789077.0, 85903.0, 14515.0, 3888.0, 1334.0, 538.0, 265.0, 164.0, 93.0, 54.0, 29.0, 24.0, 25.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.34375, -46.89697265625, -45.4501953125, -44.00341796875, -42.556640625, -41.10986328125, -39.6630859375, -38.21630859375, -36.76953125, -35.32275390625, -33.8759765625, -32.42919921875, -30.982421875, -29.53564453125, -28.0888671875, -26.64208984375, -25.1953125, -23.74853515625, -22.3017578125, -20.85498046875, -19.408203125, -17.96142578125, -16.5146484375, -15.06787109375, -13.62109375, -12.17431640625, -10.7275390625, -9.28076171875, -7.833984375, -6.38720703125, -4.9404296875, -3.49365234375, -2.046875, -0.60009765625, 0.8466796875, 2.29345703125, 3.740234375, 5.18701171875, 6.6337890625, 8.08056640625, 9.52734375, 10.97412109375, 12.4208984375, 13.86767578125, 15.314453125, 16.76123046875, 18.2080078125, 19.65478515625, 21.1015625, 22.54833984375, 23.9951171875, 25.44189453125, 26.888671875, 28.33544921875, 29.7822265625, 31.22900390625, 32.67578125, 34.12255859375, 35.5693359375, 37.01611328125, 38.462890625, 39.90966796875, 41.3564453125, 42.80322265625, 44.25]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 9.0, 11.0, 7.0, 14.0, 17.0, 40.0, 59.0, 81.0, 122.0, 143.0, 127.0, 110.0, 81.0, 48.0, 26.0, 32.0, 13.0, 17.0, 11.0, 2.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.09375, -61.37841796875, -59.6630859375, -57.94775390625, -56.232421875, -54.51708984375, -52.8017578125, -51.08642578125, -49.37109375, -47.65576171875, -45.9404296875, -44.22509765625, -42.509765625, -40.79443359375, -39.0791015625, -37.36376953125, -35.6484375, -33.93310546875, -32.2177734375, -30.50244140625, -28.787109375, -27.07177734375, -25.3564453125, -23.64111328125, -21.92578125, -20.21044921875, -18.4951171875, -16.77978515625, -15.064453125, -13.34912109375, -11.6337890625, -9.91845703125, -8.203125, -6.48779296875, -4.7724609375, -3.05712890625, -1.341796875, 0.37353515625, 2.0888671875, 3.80419921875, 5.51953125, 7.23486328125, 8.9501953125, 10.66552734375, 12.380859375, 14.09619140625, 15.8115234375, 17.52685546875, 19.2421875, 20.95751953125, 22.6728515625, 24.38818359375, 26.103515625, 27.81884765625, 29.5341796875, 31.24951171875, 32.96484375, 34.68017578125, 36.3955078125, 38.11083984375, 39.826171875, 41.54150390625, 43.2568359375, 44.97216796875, 46.6875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 16.0, 34.0, 122.0, 327.0, 355.0, 95.0, 28.0, 15.0, 8.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2877.7158203125, -2820.189453125, -2762.663330078125, -2705.136962890625, -2647.61083984375, -2590.08447265625, -2532.55810546875, -2475.031982421875, -2417.505615234375, -2359.979248046875, -2302.453125, -2244.9267578125, -2187.400634765625, -2129.874267578125, -2072.34814453125, -2014.82177734375, -1957.295654296875, -1899.7694091796875, -1842.2431640625, -1784.716796875, -1727.1905517578125, -1669.664306640625, -1612.1380615234375, -1554.61181640625, -1497.08544921875, -1439.5592041015625, -1382.032958984375, -1324.506591796875, -1266.9803466796875, -1209.4541015625, -1151.9278564453125, -1094.401611328125, -1036.87548828125, -979.3492431640625, -921.8229370117188, -864.2966918945312, -806.7704467773438, -749.244140625, -691.7178955078125, -634.191650390625, -576.665283203125, -519.1390380859375, -461.6127624511719, -404.08648681640625, -346.56024169921875, -289.0339660644531, -231.5076904296875, -173.9814453125, -116.4552001953125, -58.92893600463867, -1.4026718139648438, 56.12359619140625, 113.64985656738281, 171.17611694335938, 228.702392578125, 286.2286376953125, 343.7549133300781, 401.28118896484375, 458.80743408203125, 516.333740234375, 573.8599853515625, 631.38623046875, 688.9124755859375, 746.438720703125, 803.9650268554688]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 7.0, 10.0, 4.0, 5.0, 8.0, 10.0, 13.0, 10.0, 17.0, 28.0, 25.0, 24.0, 35.0, 44.0, 39.0, 57.0, 65.0, 84.0, 89.0, 61.0, 45.0, 28.0, 29.0, 28.0, 23.0, 22.0, 26.0, 21.0, 23.0, 6.0, 14.0, 18.0, 10.0, 10.0, 4.0, 10.0, 7.0, 1.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-648.345947265625, -626.691162109375, -605.036376953125, -583.3815307617188, -561.7267456054688, -540.0719604492188, -518.4171752929688, -496.7623596191406, -475.1075439453125, -453.4527587890625, -431.7979431152344, -410.1431579589844, -388.48834228515625, -366.83355712890625, -345.17877197265625, -323.5239562988281, -301.8691711425781, -280.2143859863281, -258.5595703125, -236.90478515625, -215.24996948242188, -193.59518432617188, -171.9403839111328, -150.28558349609375, -128.6307830810547, -106.97598266601562, -85.32118225097656, -63.66638946533203, -42.01158905029297, -20.356788635253906, 1.298004150390625, 22.952804565429688, 44.60760498046875, 66.26240539550781, 87.91720581054688, 109.5719985961914, 131.226806640625, 152.881591796875, 174.53639221191406, 196.19119262695312, 217.8459930419922, 239.50079345703125, 261.15557861328125, 282.8103942871094, 304.4651794433594, 326.1199951171875, 347.7747802734375, 369.4295654296875, 391.0843811035156, 412.7391662597656, 434.39398193359375, 456.04876708984375, 477.7035827636719, 499.3583679199219, 521.01318359375, 542.66796875, 564.32275390625, 585.9775390625, 607.63232421875, 629.2871704101562, 650.9419555664062, 672.5967407226562, 694.2515258789062, 715.9063720703125, 737.5611572265625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 10.0, 8.0, 25.0, 28.0, 51.0, 66.0, 85.0, 132.0, 210.0, 365.0, 555.0, 950.0, 1709.0, 3113.0, 6487.0, 17084.0, 59253.0, 238813.0, 1040822.0, 2042804.0, 584813.0, 135691.0, 36909.0, 12663.0, 5464.0, 2679.0, 1407.0, 781.0, 483.0, 262.0, 193.0, 129.0, 78.0, 51.0, 29.0, 24.0, 17.0, 6.0, 11.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.34375, -40.94677734375, -39.5498046875, -38.15283203125, -36.755859375, -35.35888671875, -33.9619140625, -32.56494140625, -31.16796875, -29.77099609375, -28.3740234375, -26.97705078125, -25.580078125, -24.18310546875, -22.7861328125, -21.38916015625, -19.9921875, -18.59521484375, -17.1982421875, -15.80126953125, -14.404296875, -13.00732421875, -11.6103515625, -10.21337890625, -8.81640625, -7.41943359375, -6.0224609375, -4.62548828125, -3.228515625, -1.83154296875, -0.4345703125, 0.96240234375, 2.359375, 3.75634765625, 5.1533203125, 6.55029296875, 7.947265625, 9.34423828125, 10.7412109375, 12.13818359375, 13.53515625, 14.93212890625, 16.3291015625, 17.72607421875, 19.123046875, 20.52001953125, 21.9169921875, 23.31396484375, 24.7109375, 26.10791015625, 27.5048828125, 28.90185546875, 30.298828125, 31.69580078125, 33.0927734375, 34.48974609375, 35.88671875, 37.28369140625, 38.6806640625, 40.07763671875, 41.474609375, 42.87158203125, 44.2685546875, 45.66552734375, 47.0625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 17.0, 23.0, 23.0, 24.0, 29.0, 35.0, 33.0, 49.0, 69.0, 51.0, 57.0, 62.0, 46.0, 60.0, 54.0, 45.0, 39.0, 52.0, 32.0, 34.0, 26.0, 26.0, 15.0, 14.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 4.0, 0.0, 4.0, 4.0, 4.0], "bins": [-73.375, -71.57470703125, -69.7744140625, -67.97412109375, -66.173828125, -64.37353515625, -62.5732421875, -60.77294921875, -58.97265625, -57.17236328125, -55.3720703125, -53.57177734375, -51.771484375, -49.97119140625, -48.1708984375, -46.37060546875, -44.5703125, -42.77001953125, -40.9697265625, -39.16943359375, -37.369140625, -35.56884765625, -33.7685546875, -31.96826171875, -30.16796875, -28.36767578125, -26.5673828125, -24.76708984375, -22.966796875, -21.16650390625, -19.3662109375, -17.56591796875, -15.765625, -13.96533203125, -12.1650390625, -10.36474609375, -8.564453125, -6.76416015625, -4.9638671875, -3.16357421875, -1.36328125, 0.43701171875, 2.2373046875, 4.03759765625, 5.837890625, 7.63818359375, 9.4384765625, 11.23876953125, 13.0390625, 14.83935546875, 16.6396484375, 18.43994140625, 20.240234375, 22.04052734375, 23.8408203125, 25.64111328125, 27.44140625, 29.24169921875, 31.0419921875, 32.84228515625, 34.642578125, 36.44287109375, 38.2431640625, 40.04345703125, 41.84375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 9.0, 10.0, 13.0, 32.0, 41.0, 76.0, 114.0, 282.0, 916.0, 3407.0, 21011.0, 777702.0, 3343801.0, 39599.0, 5129.0, 1233.0, 413.0, 225.0, 98.0, 52.0, 38.0, 19.0, 15.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-183.75, -178.3671875, -172.984375, -167.6015625, -162.21875, -156.8359375, -151.453125, -146.0703125, -140.6875, -135.3046875, -129.921875, -124.5390625, -119.15625, -113.7734375, -108.390625, -103.0078125, -97.625, -92.2421875, -86.859375, -81.4765625, -76.09375, -70.7109375, -65.328125, -59.9453125, -54.5625, -49.1796875, -43.796875, -38.4140625, -33.03125, -27.6484375, -22.265625, -16.8828125, -11.5, -6.1171875, -0.734375, 4.6484375, 10.03125, 15.4140625, 20.796875, 26.1796875, 31.5625, 36.9453125, 42.328125, 47.7109375, 53.09375, 58.4765625, 63.859375, 69.2421875, 74.625, 80.0078125, 85.390625, 90.7734375, 96.15625, 101.5390625, 106.921875, 112.3046875, 117.6875, 123.0703125, 128.453125, 133.8359375, 139.21875, 144.6015625, 149.984375, 155.3671875, 160.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 6.0, 6.0, 10.0, 19.0, 13.0, 22.0, 20.0, 33.0, 62.0, 102.0, 176.0, 298.0, 557.0, 804.0, 730.0, 533.0, 287.0, 148.0, 69.0, 55.0, 37.0, 24.0, 14.0, 9.0, 13.0, 5.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-105.3125, -101.9169921875, -98.521484375, -95.1259765625, -91.73046875, -88.3349609375, -84.939453125, -81.5439453125, -78.1484375, -74.7529296875, -71.357421875, -67.9619140625, -64.56640625, -61.1708984375, -57.775390625, -54.3798828125, -50.984375, -47.5888671875, -44.193359375, -40.7978515625, -37.40234375, -34.0068359375, -30.611328125, -27.2158203125, -23.8203125, -20.4248046875, -17.029296875, -13.6337890625, -10.23828125, -6.8427734375, -3.447265625, -0.0517578125, 3.34375, 6.7392578125, 10.134765625, 13.5302734375, 16.92578125, 20.3212890625, 23.716796875, 27.1123046875, 30.5078125, 33.9033203125, 37.298828125, 40.6943359375, 44.08984375, 47.4853515625, 50.880859375, 54.2763671875, 57.671875, 61.0673828125, 64.462890625, 67.8583984375, 71.25390625, 74.6494140625, 78.044921875, 81.4404296875, 84.8359375, 88.2314453125, 91.626953125, 95.0224609375, 98.41796875, 101.8134765625, 105.208984375, 108.6044921875, 112.0]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 19.0, 30.0, 55.0, 109.0, 190.0, 241.0, 157.0, 100.0, 45.0, 19.0, 7.0, 2.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-859.0454711914062, -828.9410400390625, -798.8365478515625, -768.7321166992188, -738.627685546875, -708.523193359375, -678.4187622070312, -648.3143310546875, -618.2098388671875, -588.1054077148438, -558.0009155273438, -527.896484375, -497.79205322265625, -467.6875915527344, -437.5831298828125, -407.47869873046875, -377.374267578125, -347.2698059082031, -317.1653747558594, -287.0609130859375, -256.95648193359375, -226.85202026367188, -196.74755859375, -166.6431121826172, -136.53866577148438, -106.43421936035156, -76.32976531982422, -46.225311279296875, -16.120864868164062, 13.98358154296875, 44.088043212890625, 74.19248962402344, 104.2969970703125, 134.4014434814453, 164.50588989257812, 194.6103515625, 224.7147979736328, 254.81924438476562, 284.9237060546875, 315.02813720703125, 345.1325988769531, 375.237060546875, 405.34149169921875, 435.4459533691406, 465.5504150390625, 495.65484619140625, 525.75927734375, 555.86376953125, 585.9682006835938, 616.0726318359375, 646.1771240234375, 676.2815551757812, 706.385986328125, 736.490478515625, 766.5949096679688, 796.6993408203125, 826.8038330078125, 856.9082641601562, 887.0127563476562, 917.1171875, 947.2216186523438, 977.3260498046875, 1007.4305419921875, 1037.5350341796875, 1067.639404296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 5.0, 8.0, 15.0, 24.0, 16.0, 18.0, 31.0, 33.0, 50.0, 37.0, 42.0, 48.0, 53.0, 48.0, 49.0, 53.0, 50.0, 48.0, 43.0, 65.0, 35.0, 44.0, 38.0, 28.0, 23.0, 17.0, 19.0, 15.0, 7.0, 12.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-440.7887268066406, -425.0470886230469, -409.3054504394531, -393.5638122558594, -377.8221740722656, -362.0805358886719, -346.3388671875, -330.59722900390625, -314.8555908203125, -299.11395263671875, -283.372314453125, -267.63067626953125, -251.8890380859375, -236.14739990234375, -220.40574645996094, -204.6641082763672, -188.9224853515625, -173.18084716796875, -157.439208984375, -141.69757080078125, -125.95592498779297, -110.21428680419922, -94.47264099121094, -78.73100280761719, -62.98936462402344, -47.24772644042969, -31.506084442138672, -15.764442443847656, -0.02280426025390625, 15.718833923339844, 31.460479736328125, 47.202117919921875, 62.94378662109375, 78.6854248046875, 94.42706298828125, 110.16870880126953, 125.91034698486328, 141.6519775390625, 157.3936309814453, 173.13526916503906, 188.8769073486328, 204.61854553222656, 220.3601837158203, 236.10183715820312, 251.84347534179688, 267.5851135253906, 283.3267517089844, 299.0683898925781, 314.8100280761719, 330.5516662597656, 346.2933044433594, 362.0349426269531, 377.7765808105469, 393.5182189941406, 409.2598876953125, 425.00152587890625, 440.7431640625, 456.48480224609375, 472.2264404296875, 487.96807861328125, 503.709716796875, 519.4513549804688, 535.1929931640625, 550.9346313476562, 566.67626953125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 27.0, 36.0, 58.0, 78.0, 138.0, 187.0, 306.0, 449.0, 800.0, 1376.0, 2526.0, 4567.0, 9098.0, 18610.0, 42402.0, 103074.0, 271164.0, 348178.0, 140545.0, 56135.0, 24609.0, 11449.0, 5588.0, 3022.0, 1602.0, 954.0, 560.0, 349.0, 240.0, 142.0, 86.0, 66.0, 50.0, 22.0, 19.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.75, -56.978515625, -55.20703125, -53.435546875, -51.6640625, -49.892578125, -48.12109375, -46.349609375, -44.578125, -42.806640625, -41.03515625, -39.263671875, -37.4921875, -35.720703125, -33.94921875, -32.177734375, -30.40625, -28.634765625, -26.86328125, -25.091796875, -23.3203125, -21.548828125, -19.77734375, -18.005859375, -16.234375, -14.462890625, -12.69140625, -10.919921875, -9.1484375, -7.376953125, -5.60546875, -3.833984375, -2.0625, -0.291015625, 1.48046875, 3.251953125, 5.0234375, 6.794921875, 8.56640625, 10.337890625, 12.109375, 13.880859375, 15.65234375, 17.423828125, 19.1953125, 20.966796875, 22.73828125, 24.509765625, 26.28125, 28.052734375, 29.82421875, 31.595703125, 33.3671875, 35.138671875, 36.91015625, 38.681640625, 40.453125, 42.224609375, 43.99609375, 45.767578125, 47.5390625, 49.310546875, 51.08203125, 52.853515625, 54.625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 10.0, 10.0, 18.0, 19.0, 19.0, 18.0, 21.0, 32.0, 24.0, 37.0, 37.0, 55.0, 55.0, 57.0, 45.0, 55.0, 58.0, 48.0, 44.0, 45.0, 49.0, 38.0, 24.0, 28.0, 29.0, 23.0, 17.0, 11.0, 16.0, 10.0, 12.0, 7.0, 4.0, 6.0, 0.0, 1.0, 5.0, 2.0, 2.0], "bins": [-68.6875, -66.98583984375, -65.2841796875, -63.58251953125, -61.880859375, -60.17919921875, -58.4775390625, -56.77587890625, -55.07421875, -53.37255859375, -51.6708984375, -49.96923828125, -48.267578125, -46.56591796875, -44.8642578125, -43.16259765625, -41.4609375, -39.75927734375, -38.0576171875, -36.35595703125, -34.654296875, -32.95263671875, -31.2509765625, -29.54931640625, -27.84765625, -26.14599609375, -24.4443359375, -22.74267578125, -21.041015625, -19.33935546875, -17.6376953125, -15.93603515625, -14.234375, -12.53271484375, -10.8310546875, -9.12939453125, -7.427734375, -5.72607421875, -4.0244140625, -2.32275390625, -0.62109375, 1.08056640625, 2.7822265625, 4.48388671875, 6.185546875, 7.88720703125, 9.5888671875, 11.29052734375, 12.9921875, 14.69384765625, 16.3955078125, 18.09716796875, 19.798828125, 21.50048828125, 23.2021484375, 24.90380859375, 26.60546875, 28.30712890625, 30.0087890625, 31.71044921875, 33.412109375, 35.11376953125, 36.8154296875, 38.51708984375, 40.21875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 14.0, 12.0, 22.0, 23.0, 32.0, 47.0, 85.0, 132.0, 194.0, 368.0, 804.0, 2162.0, 9157.0, 91163.0, 880387.0, 53946.0, 6795.0, 1668.0, 646.0, 349.0, 179.0, 118.0, 60.0, 42.0, 41.0, 19.0, 26.0, 14.0, 13.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.625, -163.435546875, -157.24609375, -151.056640625, -144.8671875, -138.677734375, -132.48828125, -126.298828125, -120.109375, -113.919921875, -107.73046875, -101.541015625, -95.3515625, -89.162109375, -82.97265625, -76.783203125, -70.59375, -64.404296875, -58.21484375, -52.025390625, -45.8359375, -39.646484375, -33.45703125, -27.267578125, -21.078125, -14.888671875, -8.69921875, -2.509765625, 3.6796875, 9.869140625, 16.05859375, 22.248046875, 28.4375, 34.626953125, 40.81640625, 47.005859375, 53.1953125, 59.384765625, 65.57421875, 71.763671875, 77.953125, 84.142578125, 90.33203125, 96.521484375, 102.7109375, 108.900390625, 115.08984375, 121.279296875, 127.46875, 133.658203125, 139.84765625, 146.037109375, 152.2265625, 158.416015625, 164.60546875, 170.794921875, 176.984375, 183.173828125, 189.36328125, 195.552734375, 201.7421875, 207.931640625, 214.12109375, 220.310546875, 226.5]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 11.0, 23.0, 19.0, 29.0, 23.0, 27.0, 35.0, 41.0, 34.0, 64.0, 52.0, 71.0, 83.0, 64.0, 76.0, 53.0, 45.0, 47.0, 37.0, 32.0, 31.0, 16.0, 20.0, 11.0, 8.0, 5.0, 4.0, 5.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-241.5, -234.46875, -227.4375, -220.40625, -213.375, -206.34375, -199.3125, -192.28125, -185.25, -178.21875, -171.1875, -164.15625, -157.125, -150.09375, -143.0625, -136.03125, -129.0, -121.96875, -114.9375, -107.90625, -100.875, -93.84375, -86.8125, -79.78125, -72.75, -65.71875, -58.6875, -51.65625, -44.625, -37.59375, -30.5625, -23.53125, -16.5, -9.46875, -2.4375, 4.59375, 11.625, 18.65625, 25.6875, 32.71875, 39.75, 46.78125, 53.8125, 60.84375, 67.875, 74.90625, 81.9375, 88.96875, 96.0, 103.03125, 110.0625, 117.09375, 124.125, 131.15625, 138.1875, 145.21875, 152.25, 159.28125, 166.3125, 173.34375, 180.375, 187.40625, 194.4375, 201.46875, 208.5]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 5.0, 9.0, 15.0, 21.0, 27.0, 50.0, 57.0, 88.0, 113.0, 174.0, 279.0, 461.0, 828.0, 1501.0, 3027.0, 7033.0, 18222.0, 58683.0, 254086.0, 589384.0, 75960.0, 22405.0, 8397.0, 3659.0, 1674.0, 939.0, 527.0, 335.0, 172.0, 127.0, 86.0, 53.0, 39.0, 24.0, 16.0, 21.0, 15.0, 12.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.921875, -20.226806640625, -19.53173828125, -18.836669921875, -18.1416015625, -17.446533203125, -16.75146484375, -16.056396484375, -15.361328125, -14.666259765625, -13.97119140625, -13.276123046875, -12.5810546875, -11.885986328125, -11.19091796875, -10.495849609375, -9.80078125, -9.105712890625, -8.41064453125, -7.715576171875, -7.0205078125, -6.325439453125, -5.63037109375, -4.935302734375, -4.240234375, -3.545166015625, -2.85009765625, -2.155029296875, -1.4599609375, -0.764892578125, -0.06982421875, 0.625244140625, 1.3203125, 2.015380859375, 2.71044921875, 3.405517578125, 4.1005859375, 4.795654296875, 5.49072265625, 6.185791015625, 6.880859375, 7.575927734375, 8.27099609375, 8.966064453125, 9.6611328125, 10.356201171875, 11.05126953125, 11.746337890625, 12.44140625, 13.136474609375, 13.83154296875, 14.526611328125, 15.2216796875, 15.916748046875, 16.61181640625, 17.306884765625, 18.001953125, 18.697021484375, 19.39208984375, 20.087158203125, 20.7822265625, 21.477294921875, 22.17236328125, 22.867431640625, 23.5625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 19.0, 25.0, 37.0, 67.0, 78.0, 144.0, 195.0, 155.0, 77.0, 60.0, 45.0, 33.0, 14.0, 6.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0211944580078125, -0.020669221878051758, -0.020143985748291016, -0.019618749618530273, -0.01909351348876953, -0.01856827735900879, -0.018043041229248047, -0.017517805099487305, -0.016992568969726562, -0.01646733283996582, -0.015942096710205078, -0.015416860580444336, -0.014891624450683594, -0.014366388320922852, -0.01384115219116211, -0.013315916061401367, -0.012790679931640625, -0.012265443801879883, -0.01174020767211914, -0.011214971542358398, -0.010689735412597656, -0.010164499282836914, -0.009639263153076172, -0.00911402702331543, -0.008588790893554688, -0.008063554763793945, -0.007538318634033203, -0.007013082504272461, -0.006487846374511719, -0.0059626102447509766, -0.005437374114990234, -0.004912137985229492, -0.00438690185546875, -0.003861665725708008, -0.0033364295959472656, -0.0028111934661865234, -0.0022859573364257812, -0.001760721206665039, -0.0012354850769042969, -0.0007102489471435547, -0.0001850128173828125, 0.0003402233123779297, 0.0008654594421386719, 0.001390695571899414, 0.0019159317016601562, 0.0024411678314208984, 0.0029664039611816406, 0.003491640090942383, 0.004016876220703125, 0.004542112350463867, 0.005067348480224609, 0.0055925846099853516, 0.006117820739746094, 0.006643056869506836, 0.007168292999267578, 0.00769352912902832, 0.008218765258789062, 0.008744001388549805, 0.009269237518310547, 0.009794473648071289, 0.010319709777832031, 0.010844945907592773, 0.011370182037353516, 0.011895418167114258, 0.012420654296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 9.0, 13.0, 19.0, 18.0, 31.0, 37.0, 37.0, 56.0, 101.0, 168.0, 303.0, 627.0, 1320.0, 3608.0, 12718.0, 62919.0, 677294.0, 239679.0, 36555.0, 8240.0, 2547.0, 1050.0, 503.0, 241.0, 154.0, 104.0, 46.0, 35.0, 28.0, 14.0, 16.0, 11.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.8125, -29.8134765625, -28.814453125, -27.8154296875, -26.81640625, -25.8173828125, -24.818359375, -23.8193359375, -22.8203125, -21.8212890625, -20.822265625, -19.8232421875, -18.82421875, -17.8251953125, -16.826171875, -15.8271484375, -14.828125, -13.8291015625, -12.830078125, -11.8310546875, -10.83203125, -9.8330078125, -8.833984375, -7.8349609375, -6.8359375, -5.8369140625, -4.837890625, -3.8388671875, -2.83984375, -1.8408203125, -0.841796875, 0.1572265625, 1.15625, 2.1552734375, 3.154296875, 4.1533203125, 5.15234375, 6.1513671875, 7.150390625, 8.1494140625, 9.1484375, 10.1474609375, 11.146484375, 12.1455078125, 13.14453125, 14.1435546875, 15.142578125, 16.1416015625, 17.140625, 18.1396484375, 19.138671875, 20.1376953125, 21.13671875, 22.1357421875, 23.134765625, 24.1337890625, 25.1328125, 26.1318359375, 27.130859375, 28.1298828125, 29.12890625, 30.1279296875, 31.126953125, 32.1259765625, 33.125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 2.0, 7.0, 3.0, 1.0, 10.0, 10.0, 14.0, 13.0, 12.0, 17.0, 26.0, 27.0, 41.0, 37.0, 48.0, 69.0, 61.0, 86.0, 68.0, 71.0, 66.0, 33.0, 59.0, 31.0, 26.0, 20.0, 20.0, 17.0, 7.0, 18.0, 11.0, 11.0, 6.0, 9.0, 7.0, 9.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-25.78125, -25.071533203125, -24.36181640625, -23.652099609375, -22.9423828125, -22.232666015625, -21.52294921875, -20.813232421875, -20.103515625, -19.393798828125, -18.68408203125, -17.974365234375, -17.2646484375, -16.554931640625, -15.84521484375, -15.135498046875, -14.42578125, -13.716064453125, -13.00634765625, -12.296630859375, -11.5869140625, -10.877197265625, -10.16748046875, -9.457763671875, -8.748046875, -8.038330078125, -7.32861328125, -6.618896484375, -5.9091796875, -5.199462890625, -4.48974609375, -3.780029296875, -3.0703125, -2.360595703125, -1.65087890625, -0.941162109375, -0.2314453125, 0.478271484375, 1.18798828125, 1.897705078125, 2.607421875, 3.317138671875, 4.02685546875, 4.736572265625, 5.4462890625, 6.156005859375, 6.86572265625, 7.575439453125, 8.28515625, 8.994873046875, 9.70458984375, 10.414306640625, 11.1240234375, 11.833740234375, 12.54345703125, 13.253173828125, 13.962890625, 14.672607421875, 15.38232421875, 16.092041015625, 16.8017578125, 17.511474609375, 18.22119140625, 18.930908203125, 19.640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 5.0, 12.0, 9.0, 42.0, 77.0, 236.0, 414.0, 117.0, 49.0, 21.0, 14.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1807.1153564453125, -1763.2694091796875, -1719.423583984375, -1675.57763671875, -1631.7318115234375, -1587.8858642578125, -1544.0400390625, -1500.194091796875, -1456.34814453125, -1412.502197265625, -1368.6563720703125, -1324.8104248046875, -1280.964599609375, -1237.11865234375, -1193.272705078125, -1149.4268798828125, -1105.5810546875, -1061.735107421875, -1017.8892822265625, -974.0433349609375, -930.1974487304688, -886.3515625, -842.5056762695312, -798.6597900390625, -754.8138427734375, -710.9679565429688, -667.1220703125, -623.276123046875, -579.4302368164062, -535.5843505859375, -491.73846435546875, -447.8925476074219, -404.046630859375, -360.20074462890625, -316.3548278808594, -272.5089416503906, -228.6630401611328, -184.817138671875, -140.97125244140625, -97.12533569335938, -53.279449462890625, -9.433551788330078, 34.41234588623047, 78.25823974609375, 122.10414123535156, 165.95004272460938, 209.79592895507812, 253.641845703125, 297.48773193359375, 341.3336181640625, 385.1795349121094, 429.0254211425781, 472.871337890625, 516.7172241210938, 560.5631103515625, 604.4090576171875, 648.2548828125, 692.1007690429688, 735.9466552734375, 779.7926025390625, 823.6384887695312, 867.484375, 911.3302612304688, 955.1761474609375, 999.0220947265625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 6.0, 11.0, 15.0, 15.0, 17.0, 9.0, 24.0, 24.0, 26.0, 36.0, 30.0, 49.0, 53.0, 115.0, 125.0, 82.0, 37.0, 44.0, 36.0, 26.0, 21.0, 22.0, 17.0, 21.0, 22.0, 22.0, 17.0, 10.0, 6.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-632.9547119140625, -612.6290283203125, -592.3033447265625, -571.9777221679688, -551.6520385742188, -531.3263549804688, -511.00067138671875, -490.67498779296875, -470.3493347167969, -450.0236511230469, -429.697998046875, -409.372314453125, -389.046630859375, -368.7209777832031, -348.3952941894531, -328.06964111328125, -307.74395751953125, -287.41827392578125, -267.0926208496094, -246.76693725585938, -226.44126892089844, -206.1156005859375, -185.7899169921875, -165.46424865722656, -145.13858032226562, -124.81291198730469, -104.48723602294922, -84.16156005859375, -63.83589172363281, -43.510223388671875, -23.184547424316406, -2.8588714599609375, 17.46685791015625, 37.79253005981445, 58.118202209472656, 78.44387817382812, 98.76954650878906, 119.09521484375, 139.4208984375, 159.74656677246094, 180.07223510742188, 200.3979034423828, 220.72357177734375, 241.04925537109375, 261.37493896484375, 281.7005920410156, 302.0262756347656, 322.3519287109375, 342.6776123046875, 363.0032958984375, 383.3289489746094, 403.6546325683594, 423.98028564453125, 444.30596923828125, 464.63165283203125, 484.95733642578125, 505.2829895019531, 525.608642578125, 545.934326171875, 566.260009765625, 586.585693359375, 606.911376953125, 627.2369995117188, 647.5626831054688, 667.8883666992188]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 9.0, 7.0, 16.0, 16.0, 25.0, 28.0, 36.0, 55.0, 56.0, 84.0, 117.0, 209.0, 348.0, 828.0, 2119.0, 6248.0, 26011.0, 224688.0, 2481273.0, 1324648.0, 104568.0, 15733.0, 4217.0, 1441.0, 622.0, 275.0, 174.0, 115.0, 74.0, 55.0, 41.0, 37.0, 27.0, 18.0, 10.0, 15.0, 9.0, 4.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-111.375, -107.876953125, -104.37890625, -100.880859375, -97.3828125, -93.884765625, -90.38671875, -86.888671875, -83.390625, -79.892578125, -76.39453125, -72.896484375, -69.3984375, -65.900390625, -62.40234375, -58.904296875, -55.40625, -51.908203125, -48.41015625, -44.912109375, -41.4140625, -37.916015625, -34.41796875, -30.919921875, -27.421875, -23.923828125, -20.42578125, -16.927734375, -13.4296875, -9.931640625, -6.43359375, -2.935546875, 0.5625, 4.060546875, 7.55859375, 11.056640625, 14.5546875, 18.052734375, 21.55078125, 25.048828125, 28.546875, 32.044921875, 35.54296875, 39.041015625, 42.5390625, 46.037109375, 49.53515625, 53.033203125, 56.53125, 60.029296875, 63.52734375, 67.025390625, 70.5234375, 74.021484375, 77.51953125, 81.017578125, 84.515625, 88.013671875, 91.51171875, 95.009765625, 98.5078125, 102.005859375, 105.50390625, 109.001953125, 112.5]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 17.0, 10.0, 11.0, 15.0, 15.0, 22.0, 25.0, 27.0, 34.0, 32.0, 39.0, 42.0, 50.0, 54.0, 50.0, 59.0, 40.0, 49.0, 54.0, 43.0, 44.0, 39.0, 34.0, 32.0, 25.0, 28.0, 28.0, 16.0, 11.0, 11.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-59.875, -58.33349609375, -56.7919921875, -55.25048828125, -53.708984375, -52.16748046875, -50.6259765625, -49.08447265625, -47.54296875, -46.00146484375, -44.4599609375, -42.91845703125, -41.376953125, -39.83544921875, -38.2939453125, -36.75244140625, -35.2109375, -33.66943359375, -32.1279296875, -30.58642578125, -29.044921875, -27.50341796875, -25.9619140625, -24.42041015625, -22.87890625, -21.33740234375, -19.7958984375, -18.25439453125, -16.712890625, -15.17138671875, -13.6298828125, -12.08837890625, -10.546875, -9.00537109375, -7.4638671875, -5.92236328125, -4.380859375, -2.83935546875, -1.2978515625, 0.24365234375, 1.78515625, 3.32666015625, 4.8681640625, 6.40966796875, 7.951171875, 9.49267578125, 11.0341796875, 12.57568359375, 14.1171875, 15.65869140625, 17.2001953125, 18.74169921875, 20.283203125, 21.82470703125, 23.3662109375, 24.90771484375, 26.44921875, 27.99072265625, 29.5322265625, 31.07373046875, 32.615234375, 34.15673828125, 35.6982421875, 37.23974609375, 38.78125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 10.0, 24.0, 69.0, 150.0, 387.0, 1692.0, 37562.0, 4146052.0, 6997.0, 890.0, 274.0, 97.0, 35.0, 18.0, 10.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-565.5, -544.015625, -522.53125, -501.046875, -479.5625, -458.078125, -436.59375, -415.109375, -393.625, -372.140625, -350.65625, -329.171875, -307.6875, -286.203125, -264.71875, -243.234375, -221.75, -200.265625, -178.78125, -157.296875, -135.8125, -114.328125, -92.84375, -71.359375, -49.875, -28.390625, -6.90625, 14.578125, 36.0625, 57.546875, 79.03125, 100.515625, 122.0, 143.484375, 164.96875, 186.453125, 207.9375, 229.421875, 250.90625, 272.390625, 293.875, 315.359375, 336.84375, 358.328125, 379.8125, 401.296875, 422.78125, 444.265625, 465.75, 487.234375, 508.71875, 530.203125, 551.6875, 573.171875, 594.65625, 616.140625, 637.625, 659.109375, 680.59375, 702.078125, 723.5625, 745.046875, 766.53125, 788.015625, 809.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 14.0, 21.0, 65.0, 149.0, 355.0, 1118.0, 1555.0, 514.0, 156.0, 74.0, 37.0, 13.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.75, -452.5625, -440.375, -428.1875, -416.0, -403.8125, -391.625, -379.4375, -367.25, -355.0625, -342.875, -330.6875, -318.5, -306.3125, -294.125, -281.9375, -269.75, -257.5625, -245.375, -233.1875, -221.0, -208.8125, -196.625, -184.4375, -172.25, -160.0625, -147.875, -135.6875, -123.5, -111.3125, -99.125, -86.9375, -74.75, -62.5625, -50.375, -38.1875, -26.0, -13.8125, -1.625, 10.5625, 22.75, 34.9375, 47.125, 59.3125, 71.5, 83.6875, 95.875, 108.0625, 120.25, 132.4375, 144.625, 156.8125, 169.0, 181.1875, 193.375, 205.5625, 217.75, 229.9375, 242.125, 254.3125, 266.5, 278.6875, 290.875, 303.0625, 315.25]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 6.0, 7.0, 19.0, 16.0, 35.0, 52.0, 103.0, 142.0, 201.0, 148.0, 109.0, 68.0, 35.0, 20.0, 9.0, 7.0, 7.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1939.178466796875, -1887.5079345703125, -1835.8372802734375, -1784.166748046875, -1732.49609375, -1680.8255615234375, -1629.155029296875, -1577.484375, -1525.813720703125, -1474.1431884765625, -1422.4725341796875, -1370.802001953125, -1319.13134765625, -1267.4608154296875, -1215.790283203125, -1164.11962890625, -1112.4490966796875, -1060.778564453125, -1009.10791015625, -957.4373779296875, -905.7667236328125, -854.09619140625, -802.4255981445312, -750.7550048828125, -699.0844116210938, -647.413818359375, -595.7432250976562, -544.0726318359375, -492.4020690917969, -440.7314758300781, -389.0609130859375, -337.39031982421875, -285.7197265625, -234.04913330078125, -182.37855529785156, -130.70797729492188, -79.03738403320312, -27.366790771484375, 24.30377197265625, 75.974365234375, 127.64495849609375, 179.3155517578125, 230.9861297607422, 282.6567077636719, 334.3273010253906, 385.9978942871094, 437.66845703125, 489.33905029296875, 541.0096435546875, 592.6802368164062, 644.350830078125, 696.0213623046875, 747.6920166015625, 799.362548828125, 851.0331420898438, 902.7037353515625, 954.3743286132812, 1006.044921875, 1057.7154541015625, 1109.3861083984375, 1161.056640625, 1212.727294921875, 1264.3978271484375, 1316.068359375, 1367.739013671875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 8.0, 13.0, 10.0, 22.0, 22.0, 24.0, 28.0, 22.0, 30.0, 33.0, 33.0, 33.0, 34.0, 41.0, 40.0, 47.0, 53.0, 66.0, 48.0, 43.0, 38.0, 37.0, 34.0, 42.0, 28.0, 34.0, 15.0, 19.0, 13.0, 13.0, 16.0, 13.0, 9.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-781.1297607421875, -758.0313110351562, -734.9329223632812, -711.83447265625, -688.736083984375, -665.6376342773438, -642.5391845703125, -619.4407958984375, -596.3423461914062, -573.243896484375, -550.1455078125, -527.0470581054688, -503.9486389160156, -480.8502197265625, -457.7518005371094, -434.65338134765625, -411.5549621582031, -388.45654296875, -365.3581237792969, -342.25970458984375, -319.1612548828125, -296.0628356933594, -272.96441650390625, -249.86598205566406, -226.76756286621094, -203.6691436767578, -180.57070922851562, -157.4722900390625, -134.37387084960938, -111.27543640136719, -88.17701721191406, -65.07858276367188, -41.98016357421875, -18.881738662719727, 4.216686248779297, 27.315109252929688, 50.413536071777344, 73.511962890625, 96.61038208007812, 119.70881652832031, 142.80723571777344, 165.90565490722656, 189.00408935546875, 212.10250854492188, 235.200927734375, 258.29937744140625, 281.39776611328125, 304.4962158203125, 327.5946350097656, 350.69305419921875, 373.7914733886719, 396.889892578125, 419.98834228515625, 443.0867614746094, 466.1851806640625, 489.28363037109375, 512.3820190429688, 535.48046875, 558.578857421875, 581.6773071289062, 604.7756958007812, 627.8741455078125, 650.9725341796875, 674.0709838867188, 697.16943359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 2.0, 9.0, 9.0, 10.0, 18.0, 31.0, 27.0, 48.0, 62.0, 106.0, 124.0, 222.0, 322.0, 622.0, 1028.0, 1813.0, 3528.0, 7278.0, 15554.0, 37922.0, 107503.0, 451320.0, 288742.0, 78191.0, 29003.0, 12470.0, 5844.0, 2893.0, 1543.0, 880.0, 523.0, 268.0, 203.0, 141.0, 81.0, 54.0, 39.0, 32.0, 23.0, 16.0, 8.0, 13.0, 6.0, 12.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-83.6875, -81.2158203125, -78.744140625, -76.2724609375, -73.80078125, -71.3291015625, -68.857421875, -66.3857421875, -63.9140625, -61.4423828125, -58.970703125, -56.4990234375, -54.02734375, -51.5556640625, -49.083984375, -46.6123046875, -44.140625, -41.6689453125, -39.197265625, -36.7255859375, -34.25390625, -31.7822265625, -29.310546875, -26.8388671875, -24.3671875, -21.8955078125, -19.423828125, -16.9521484375, -14.48046875, -12.0087890625, -9.537109375, -7.0654296875, -4.59375, -2.1220703125, 0.349609375, 2.8212890625, 5.29296875, 7.7646484375, 10.236328125, 12.7080078125, 15.1796875, 17.6513671875, 20.123046875, 22.5947265625, 25.06640625, 27.5380859375, 30.009765625, 32.4814453125, 34.953125, 37.4248046875, 39.896484375, 42.3681640625, 44.83984375, 47.3115234375, 49.783203125, 52.2548828125, 54.7265625, 57.1982421875, 59.669921875, 62.1416015625, 64.61328125, 67.0849609375, 69.556640625, 72.0283203125, 74.5]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 8.0, 3.0, 6.0, 14.0, 21.0, 14.0, 13.0, 27.0, 21.0, 28.0, 31.0, 38.0, 45.0, 53.0, 41.0, 54.0, 46.0, 62.0, 53.0, 46.0, 38.0, 42.0, 43.0, 32.0, 33.0, 17.0, 23.0, 25.0, 20.0, 18.0, 12.0, 9.0, 13.0, 9.0, 3.0, 4.0, 2.0, 9.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-66.5, -64.57373046875, -62.6474609375, -60.72119140625, -58.794921875, -56.86865234375, -54.9423828125, -53.01611328125, -51.08984375, -49.16357421875, -47.2373046875, -45.31103515625, -43.384765625, -41.45849609375, -39.5322265625, -37.60595703125, -35.6796875, -33.75341796875, -31.8271484375, -29.90087890625, -27.974609375, -26.04833984375, -24.1220703125, -22.19580078125, -20.26953125, -18.34326171875, -16.4169921875, -14.49072265625, -12.564453125, -10.63818359375, -8.7119140625, -6.78564453125, -4.859375, -2.93310546875, -1.0068359375, 0.91943359375, 2.845703125, 4.77197265625, 6.6982421875, 8.62451171875, 10.55078125, 12.47705078125, 14.4033203125, 16.32958984375, 18.255859375, 20.18212890625, 22.1083984375, 24.03466796875, 25.9609375, 27.88720703125, 29.8134765625, 31.73974609375, 33.666015625, 35.59228515625, 37.5185546875, 39.44482421875, 41.37109375, 43.29736328125, 45.2236328125, 47.14990234375, 49.076171875, 51.00244140625, 52.9287109375, 54.85498046875, 56.78125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 12.0, 10.0, 13.0, 21.0, 39.0, 48.0, 88.0, 142.0, 308.0, 646.0, 1701.0, 7088.0, 68428.0, 932271.0, 30940.0, 4485.0, 1218.0, 533.0, 256.0, 114.0, 62.0, 42.0, 29.0, 12.0, 18.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.75, -178.125, -170.5, -162.875, -155.25, -147.625, -140.0, -132.375, -124.75, -117.125, -109.5, -101.875, -94.25, -86.625, -79.0, -71.375, -63.75, -56.125, -48.5, -40.875, -33.25, -25.625, -18.0, -10.375, -2.75, 4.875, 12.5, 20.125, 27.75, 35.375, 43.0, 50.625, 58.25, 65.875, 73.5, 81.125, 88.75, 96.375, 104.0, 111.625, 119.25, 126.875, 134.5, 142.125, 149.75, 157.375, 165.0, 172.625, 180.25, 187.875, 195.5, 203.125, 210.75, 218.375, 226.0, 233.625, 241.25, 248.875, 256.5, 264.125, 271.75, 279.375, 287.0, 294.625, 302.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 4.0, 7.0, 10.0, 17.0, 14.0, 17.0, 20.0, 25.0, 33.0, 36.0, 39.0, 51.0, 80.0, 92.0, 101.0, 91.0, 59.0, 46.0, 45.0, 33.0, 33.0, 24.0, 25.0, 16.0, 18.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-417.25, -405.46875, -393.6875, -381.90625, -370.125, -358.34375, -346.5625, -334.78125, -323.0, -311.21875, -299.4375, -287.65625, -275.875, -264.09375, -252.3125, -240.53125, -228.75, -216.96875, -205.1875, -193.40625, -181.625, -169.84375, -158.0625, -146.28125, -134.5, -122.71875, -110.9375, -99.15625, -87.375, -75.59375, -63.8125, -52.03125, -40.25, -28.46875, -16.6875, -4.90625, 6.875, 18.65625, 30.4375, 42.21875, 54.0, 65.78125, 77.5625, 89.34375, 101.125, 112.90625, 124.6875, 136.46875, 148.25, 160.03125, 171.8125, 183.59375, 195.375, 207.15625, 218.9375, 230.71875, 242.5, 254.28125, 266.0625, 277.84375, 289.625, 301.40625, 313.1875, 324.96875, 336.75]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 19.0, 16.0, 32.0, 78.0, 92.0, 158.0, 370.0, 902.0, 2263.0, 7338.0, 33057.0, 809606.0, 166564.0, 20274.0, 5012.0, 1574.0, 617.0, 265.0, 127.0, 67.0, 54.0, 20.0, 15.0, 7.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-52.5625, -51.3359375, -50.109375, -48.8828125, -47.65625, -46.4296875, -45.203125, -43.9765625, -42.75, -41.5234375, -40.296875, -39.0703125, -37.84375, -36.6171875, -35.390625, -34.1640625, -32.9375, -31.7109375, -30.484375, -29.2578125, -28.03125, -26.8046875, -25.578125, -24.3515625, -23.125, -21.8984375, -20.671875, -19.4453125, -18.21875, -16.9921875, -15.765625, -14.5390625, -13.3125, -12.0859375, -10.859375, -9.6328125, -8.40625, -7.1796875, -5.953125, -4.7265625, -3.5, -2.2734375, -1.046875, 0.1796875, 1.40625, 2.6328125, 3.859375, 5.0859375, 6.3125, 7.5390625, 8.765625, 9.9921875, 11.21875, 12.4453125, 13.671875, 14.8984375, 16.125, 17.3515625, 18.578125, 19.8046875, 21.03125, 22.2578125, 23.484375, 24.7109375, 25.9375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 5.0, 10.0, 8.0, 8.0, 7.0, 11.0, 19.0, 26.0, 34.0, 36.0, 53.0, 82.0, 98.0, 121.0, 116.0, 95.0, 74.0, 38.0, 23.0, 21.0, 24.0, 14.0, 9.0, 14.0, 4.0, 7.0, 8.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01104736328125, -0.010699152946472168, -0.010350942611694336, -0.010002732276916504, -0.009654521942138672, -0.00930631160736084, -0.008958101272583008, -0.008609890937805176, -0.008261680603027344, -0.007913470268249512, -0.00756525993347168, -0.007217049598693848, -0.006868839263916016, -0.006520628929138184, -0.0061724185943603516, -0.0058242082595825195, -0.0054759979248046875, -0.0051277875900268555, -0.0047795772552490234, -0.004431366920471191, -0.004083156585693359, -0.0037349462509155273, -0.0033867359161376953, -0.0030385255813598633, -0.0026903152465820312, -0.0023421049118041992, -0.001993894577026367, -0.0016456842422485352, -0.0012974739074707031, -0.0009492635726928711, -0.0006010532379150391, -0.00025284290313720703, 9.5367431640625e-05, 0.00044357776641845703, 0.0007917881011962891, 0.001139998435974121, 0.0014882087707519531, 0.0018364191055297852, 0.002184629440307617, 0.0025328397750854492, 0.0028810501098632812, 0.0032292604446411133, 0.0035774707794189453, 0.003925681114196777, 0.004273891448974609, 0.004622101783752441, 0.0049703121185302734, 0.0053185224533081055, 0.0056667327880859375, 0.0060149431228637695, 0.0063631534576416016, 0.006711363792419434, 0.007059574127197266, 0.007407784461975098, 0.00775599479675293, 0.008104205131530762, 0.008452415466308594, 0.008800625801086426, 0.009148836135864258, 0.00949704647064209, 0.009845256805419922, 0.010193467140197754, 0.010541677474975586, 0.010889887809753418, 0.01123809814453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 11.0, 10.0, 15.0, 20.0, 36.0, 46.0, 58.0, 87.0, 152.0, 253.0, 553.0, 939.0, 2434.0, 7566.0, 33010.0, 778010.0, 195343.0, 21129.0, 5362.0, 1823.0, 790.0, 405.0, 201.0, 99.0, 61.0, 51.0, 23.0, 20.0, 7.0, 5.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.01953125, -31.9140625, -30.80859375, -29.703125, -28.59765625, -27.4921875, -26.38671875, -25.28125, -24.17578125, -23.0703125, -21.96484375, -20.859375, -19.75390625, -18.6484375, -17.54296875, -16.4375, -15.33203125, -14.2265625, -13.12109375, -12.015625, -10.91015625, -9.8046875, -8.69921875, -7.59375, -6.48828125, -5.3828125, -4.27734375, -3.171875, -2.06640625, -0.9609375, 0.14453125, 1.25, 2.35546875, 3.4609375, 4.56640625, 5.671875, 6.77734375, 7.8828125, 8.98828125, 10.09375, 11.19921875, 12.3046875, 13.41015625, 14.515625, 15.62109375, 16.7265625, 17.83203125, 18.9375, 20.04296875, 21.1484375, 22.25390625, 23.359375, 24.46484375, 25.5703125, 26.67578125, 27.78125, 28.88671875, 29.9921875, 31.09765625, 32.203125, 33.30859375, 34.4140625, 35.51953125, 36.625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 6.0, 5.0, 12.0, 7.0, 6.0, 11.0, 15.0, 11.0, 18.0, 21.0, 41.0, 55.0, 52.0, 87.0, 89.0, 103.0, 106.0, 80.0, 66.0, 42.0, 36.0, 27.0, 18.0, 17.0, 17.0, 12.0, 4.0, 6.0, 6.0, 4.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.65625, -41.46826171875, -40.2802734375, -39.09228515625, -37.904296875, -36.71630859375, -35.5283203125, -34.34033203125, -33.15234375, -31.96435546875, -30.7763671875, -29.58837890625, -28.400390625, -27.21240234375, -26.0244140625, -24.83642578125, -23.6484375, -22.46044921875, -21.2724609375, -20.08447265625, -18.896484375, -17.70849609375, -16.5205078125, -15.33251953125, -14.14453125, -12.95654296875, -11.7685546875, -10.58056640625, -9.392578125, -8.20458984375, -7.0166015625, -5.82861328125, -4.640625, -3.45263671875, -2.2646484375, -1.07666015625, 0.111328125, 1.29931640625, 2.4873046875, 3.67529296875, 4.86328125, 6.05126953125, 7.2392578125, 8.42724609375, 9.615234375, 10.80322265625, 11.9912109375, 13.17919921875, 14.3671875, 15.55517578125, 16.7431640625, 17.93115234375, 19.119140625, 20.30712890625, 21.4951171875, 22.68310546875, 23.87109375, 25.05908203125, 26.2470703125, 27.43505859375, 28.623046875, 29.81103515625, 30.9990234375, 32.18701171875, 33.375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 6.0, 6.0, 17.0, 28.0, 57.0, 99.0, 455.0, 192.0, 59.0, 44.0, 15.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2002.5418701171875, -1953.463134765625, -1904.3843994140625, -1855.3056640625, -1806.2269287109375, -1757.148193359375, -1708.0694580078125, -1658.99072265625, -1609.9119873046875, -1560.833251953125, -1511.7545166015625, -1462.67578125, -1413.5970458984375, -1364.518310546875, -1315.4395751953125, -1266.36083984375, -1217.2821044921875, -1168.203369140625, -1119.1246337890625, -1070.0458984375, -1020.9671630859375, -971.888427734375, -922.8096923828125, -873.73095703125, -824.6522216796875, -775.573486328125, -726.4947509765625, -677.416015625, -628.3372802734375, -579.258544921875, -530.1798095703125, -481.10107421875, -432.0224609375, -382.9437255859375, -333.864990234375, -284.7862548828125, -235.70751953125, -186.6287841796875, -137.550048828125, -88.4713134765625, -39.392578125, 9.6861572265625, 58.764892578125, 107.8436279296875, 156.92236328125, 206.0010986328125, 255.079833984375, 304.1585693359375, 353.2373046875, 402.3160400390625, 451.394775390625, 500.4735107421875, 549.55224609375, 598.6309814453125, 647.709716796875, 696.7884521484375, 745.8671875, 794.9459228515625, 844.024658203125, 893.1033935546875, 942.18212890625, 991.2608642578125, 1040.339599609375, 1089.4183349609375, 1138.4970703125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 13.0, 4.0, 8.0, 10.0, 12.0, 16.0, 17.0, 20.0, 13.0, 24.0, 27.0, 27.0, 34.0, 62.0, 179.0, 214.0, 79.0, 38.0, 32.0, 30.0, 19.0, 20.0, 18.0, 16.0, 5.0, 8.0, 11.0, 5.0, 8.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-811.7107543945312, -781.8485107421875, -751.9862060546875, -722.1239624023438, -692.26171875, -662.3994750976562, -632.5372314453125, -602.6749267578125, -572.8126831054688, -542.950439453125, -513.088134765625, -483.22589111328125, -453.3636474609375, -423.50140380859375, -393.6391296386719, -363.77685546875, -333.91461181640625, -304.0523681640625, -274.1900939941406, -244.3278350830078, -214.465576171875, -184.6033172607422, -154.74105834960938, -124.87879943847656, -95.01654052734375, -65.15428161621094, -35.292022705078125, -5.4297637939453125, 24.4324951171875, 54.29475402832031, 84.15701293945312, 114.01927185058594, 143.881591796875, 173.7438507080078, 203.60610961914062, 233.46836853027344, 263.33062744140625, 293.19287109375, 323.0551452636719, 352.91741943359375, 382.7796630859375, 412.64190673828125, 442.5041809082031, 472.366455078125, 502.22869873046875, 532.0909423828125, 561.9532470703125, 591.8154907226562, 621.677734375, 651.5399780273438, 681.4022216796875, 711.2645263671875, 741.1267700195312, 770.989013671875, 800.851318359375, 830.7135620117188, 860.5758056640625, 890.4380493164062, 920.30029296875, 950.16259765625, 980.0248413085938, 1009.8870849609375, 1039.7493896484375, 1069.611572265625, 1099.473876953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 9.0, 5.0, 3.0, 7.0, 10.0, 10.0, 12.0, 13.0, 17.0, 19.0, 22.0, 25.0, 36.0, 45.0, 55.0, 124.0, 196.0, 76.0, 62.0, 37.0, 29.0, 37.0, 26.0, 20.0, 26.0, 16.0, 15.0, 10.0, 11.0, 6.0, 2.0, 7.0, 2.0, 4.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.5625, -46.3974609375, -44.232421875, -42.0673828125, -39.90234375, -37.7373046875, -35.572265625, -33.4072265625, -31.2421875, -29.0771484375, -26.912109375, -24.7470703125, -22.58203125, -20.4169921875, -18.251953125, -16.0869140625, -13.921875, -11.7568359375, -9.591796875, -7.4267578125, -5.26171875, -3.0966796875, -0.931640625, 1.2333984375, 3.3984375, 5.5634765625, 7.728515625, 9.8935546875, 12.05859375, 14.2236328125, 16.388671875, 18.5537109375, 20.71875, 22.8837890625, 25.048828125, 27.2138671875, 29.37890625, 31.5439453125, 33.708984375, 35.8740234375, 38.0390625, 40.2041015625, 42.369140625, 44.5341796875, 46.69921875, 48.8642578125, 51.029296875, 53.1943359375, 55.359375, 57.5244140625, 59.689453125, 61.8544921875, 64.01953125, 66.1845703125, 68.349609375, 70.5146484375, 72.6796875, 74.8447265625, 77.009765625, 79.1748046875, 81.33984375, 83.5048828125, 85.669921875, 87.8349609375, 90.0]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0, 4.0, 10.0, 11.0, 6.0, 13.0, 15.0, 21.0, 24.0, 24.0, 60.0, 106.0, 167.0, 336.0, 721.0, 2171.0, 9514.0, 8327996.0, 40952.0, 4274.0, 1166.0, 470.0, 171.0, 114.0, 63.0, 54.0, 25.0, 16.0, 10.0, 14.0, 6.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-537.6149291992188, -522.1497192382812, -506.6845397949219, -491.2193603515625, -475.754150390625, -460.2889709472656, -444.8237609863281, -429.35858154296875, -413.89337158203125, -398.4281921386719, -382.9629821777344, -367.497802734375, -352.0325927734375, -336.5674133300781, -321.1022033691406, -305.63702392578125, -290.17181396484375, -274.7066345214844, -259.2414245605469, -243.77622985839844, -228.31103515625, -212.84585571289062, -197.38064575195312, -181.91546630859375, -166.45028686523438, -150.98509216308594, -135.5198974609375, -120.05470275878906, -104.58950805664062, -89.12432098388672, -73.65912628173828, -58.193931579589844, -42.728729248046875, -27.263534545898438, -11.798341751098633, 3.666851043701172, 19.13204574584961, 34.59723663330078, 50.06243133544922, 65.52762603759766, 80.9928207397461, 96.45801544189453, 111.92321014404297, 127.38839721679688, 142.8535919189453, 158.31878662109375, 173.7839813232422, 189.24917602539062, 204.71437072753906, 220.1795654296875, 235.64476013183594, 251.10995483398438, 266.57513427734375, 282.04034423828125, 297.5055236816406, 312.9707336425781, 328.4359130859375, 343.9010925292969, 359.3663024902344, 374.83148193359375, 390.29669189453125, 405.7618713378906, 421.2270812988281, 436.6922607421875, 452.157470703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 4.0, 7.0, 3.0, 5.0, 5.0, 7.0, 5.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-373.5076904296875, -359.2933044433594, -345.07891845703125, -330.8645324707031, -316.650146484375, -302.4357604980469, -288.22137451171875, -274.0069885253906, -259.7926025390625, -245.57821655273438, -231.36383056640625, -217.14944458007812, -202.93505859375, -188.72067260742188, -174.50628662109375, -160.29190063476562, -146.07752990722656, -131.86314392089844, -117.64875793457031, -103.43437194824219, -89.21998596191406, -75.00560760498047, -60.791221618652344, -46.57683563232422, -32.362449645996094, -18.14806365966797, -3.9336795806884766, 10.280704498291016, 24.49509048461914, 38.70947265625, 52.923858642578125, 67.13824462890625, 81.35263061523438, 95.5670166015625, 109.78140258789062, 123.99578857421875, 138.21017456054688, 152.424560546875, 166.63894653320312, 180.85333251953125, 195.06771850585938, 209.2821044921875, 223.49649047851562, 237.71087646484375, 251.92526245117188, 266.1396484375, 280.3540344238281, 294.56842041015625, 308.78277587890625, 322.9971618652344, 337.2115478515625, 351.4259338378906, 365.64031982421875, 379.8547058105469, 394.069091796875, 408.2834777832031, 422.49786376953125, 436.7122497558594, 450.9266357421875, 465.1410217285156, 479.35540771484375, 493.5697937011719, 507.7841796875, 521.99853515625, 536.2129516601562]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 7.0, 10.0, 9.0, 16.0, 16.0, 30.0, 31.0, 40.0, 51.0, 60.0, 56.0, 62.0, 80.0, 77.0, 71.0, 64.0, 55.0, 40.0, 38.0, 41.0, 28.0, 24.0, 26.0, 13.0, 20.0, 6.0, 7.0, 3.0, 1.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.875, -37.3623046875, -35.849609375, -34.3369140625, -32.82421875, -31.3115234375, -29.798828125, -28.2861328125, -26.7734375, -25.2607421875, -23.748046875, -22.2353515625, -20.72265625, -19.2099609375, -17.697265625, -16.1845703125, -14.671875, -13.1591796875, -11.646484375, -10.1337890625, -8.62109375, -7.1083984375, -5.595703125, -4.0830078125, -2.5703125, -1.0576171875, 0.455078125, 1.9677734375, 3.48046875, 4.9931640625, 6.505859375, 8.0185546875, 9.53125, 11.0439453125, 12.556640625, 14.0693359375, 15.58203125, 17.0947265625, 18.607421875, 20.1201171875, 21.6328125, 23.1455078125, 24.658203125, 26.1708984375, 27.68359375, 29.1962890625, 30.708984375, 32.2216796875, 33.734375, 35.2470703125, 36.759765625, 38.2724609375, 39.78515625, 41.2978515625, 42.810546875, 44.3232421875, 45.8359375, 47.3486328125, 48.861328125, 50.3740234375, 51.88671875, 53.3994140625, 54.912109375, 56.4248046875, 57.9375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 11.0, 5.0, 4.0, 8.0, 19.0, 16.0, 23.0, 41.0, 72.0, 102.0, 153.0, 257.0, 493.0, 731.0, 1441.0, 2833.0, 6169.0, 14143.0, 35592.0, 97478.0, 189860.0, 106797.0, 39414.0, 15538.0, 6551.0, 3153.0, 1453.0, 776.0, 477.0, 249.0, 163.0, 92.0, 53.0, 32.0, 25.0, 15.0, 12.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-409.25, -398.3515625, -387.453125, -376.5546875, -365.65625, -354.7578125, -343.859375, -332.9609375, -322.0625, -311.1640625, -300.265625, -289.3671875, -278.46875, -267.5703125, -256.671875, -245.7734375, -234.875, -223.9765625, -213.078125, -202.1796875, -191.28125, -180.3828125, -169.484375, -158.5859375, -147.6875, -136.7890625, -125.890625, -114.9921875, -104.09375, -93.1953125, -82.296875, -71.3984375, -60.5, -49.6015625, -38.703125, -27.8046875, -16.90625, -6.0078125, 4.890625, 15.7890625, 26.6875, 37.5859375, 48.484375, 59.3828125, 70.28125, 81.1796875, 92.078125, 102.9765625, 113.875, 124.7734375, 135.671875, 146.5703125, 157.46875, 168.3671875, 179.265625, 190.1640625, 201.0625, 211.9609375, 222.859375, 233.7578125, 244.65625, 255.5546875, 266.453125, 277.3515625, 288.25]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 10.0, 15.0, 15.0, 12.0, 29.0, 23.0, 29.0, 36.0, 31.0, 51.0, 45.0, 54.0, 62.0, 53.0, 68.0, 51.0, 59.0, 64.0, 53.0, 40.0, 35.0, 28.0, 23.0, 13.0, 17.0, 18.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.25, -56.19921875, -54.1484375, -52.09765625, -50.046875, -47.99609375, -45.9453125, -43.89453125, -41.84375, -39.79296875, -37.7421875, -35.69140625, -33.640625, -31.58984375, -29.5390625, -27.48828125, -25.4375, -23.38671875, -21.3359375, -19.28515625, -17.234375, -15.18359375, -13.1328125, -11.08203125, -9.03125, -6.98046875, -4.9296875, -2.87890625, -0.828125, 1.22265625, 3.2734375, 5.32421875, 7.375, 9.42578125, 11.4765625, 13.52734375, 15.578125, 17.62890625, 19.6796875, 21.73046875, 23.78125, 25.83203125, 27.8828125, 29.93359375, 31.984375, 34.03515625, 36.0859375, 38.13671875, 40.1875, 42.23828125, 44.2890625, 46.33984375, 48.390625, 50.44140625, 52.4921875, 54.54296875, 56.59375, 58.64453125, 60.6953125, 62.74609375, 64.796875, 66.84765625, 68.8984375, 70.94921875, 73.0]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 14.0, 22.0, 34.0, 64.0, 56.0, 68.0, 47.0, 50.0, 31.0, 14.0, 17.0, 11.0, 8.0, 9.0, 6.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-356.912353515625, -344.955322265625, -332.998291015625, -321.041259765625, -309.0841979980469, -297.1271667480469, -285.1701354980469, -273.2131042480469, -261.2560729980469, -249.29904174804688, -237.3419952392578, -225.3849639892578, -213.4279327392578, -201.47088623046875, -189.51385498046875, -177.55682373046875, -165.5997772216797, -153.6427459716797, -141.68569946289062, -129.72866821289062, -117.77163696289062, -105.8145980834961, -93.85755920410156, -81.90052795410156, -69.94348907470703, -57.986454010009766, -46.0294189453125, -34.07238006591797, -22.115345001220703, -10.158309936523438, 1.7987289428710938, 13.755760192871094, 25.712799072265625, 37.66983413696289, 49.626869201660156, 61.58390808105469, 73.54093933105469, 85.49797821044922, 97.45501708984375, 109.41204833984375, 121.36908721923828, 133.3261260986328, 145.2831573486328, 157.24020385742188, 169.19723510742188, 181.15426635742188, 193.11129760742188, 205.06832885742188, 217.02537536621094, 228.98240661621094, 240.939453125, 252.896484375, 264.853515625, 276.810546875, 288.767578125, 300.724609375, 312.6816711425781, 324.6387023925781, 336.5957336425781, 348.55279541015625, 360.50982666015625, 372.46685791015625, 384.42388916015625, 396.38092041015625, 408.33795166015625]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 6.0, 6.0, 3.0, 5.0, 2.0, 9.0, 12.0, 21.0, 67.0, 87.0, 89.0, 53.0, 39.0, 17.0, 11.0, 10.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-300.09393310546875, -287.365966796875, -274.63800048828125, -261.9100646972656, -249.18209838867188, -236.45413208007812, -223.72616577148438, -210.9982147216797, -198.270263671875, -185.54229736328125, -172.81434631347656, -160.0863800048828, -147.35842895507812, -134.63046264648438, -121.90250396728516, -109.17454528808594, -96.44657897949219, -83.71862030029297, -70.99066162109375, -58.262699127197266, -45.53474044799805, -32.80678176879883, -20.078819274902344, -7.350860595703125, 5.377098083496094, 18.105056762695312, 30.833017349243164, 43.560977935791016, 56.288936614990234, 69.01689147949219, 81.74485778808594, 94.47281646728516, 107.20077514648438, 119.9287338256836, 132.6566925048828, 145.38465881347656, 158.11260986328125, 170.840576171875, 183.56854248046875, 196.29649353027344, 209.02444458007812, 221.75241088867188, 234.48036193847656, 247.2083282470703, 259.936279296875, 272.66424560546875, 285.3922119140625, 298.12017822265625, 310.84814453125, 323.57611083984375, 336.3040771484375, 349.0320129394531, 361.7599792480469, 374.4879455566406, 387.2159118652344, 399.94384765625, 412.67181396484375, 425.3997802734375, 438.12774658203125, 450.8556823730469, 463.5836486816406, 476.3116149902344, 489.0395812988281, 501.76751708984375, 514.4954833984375]}, "eval/loss": 0.6976933479309082, "eval/wer": 0.12308607695358985, "eval/runtime": 636.3851, "eval/samples_per_second": 4.152, "eval/steps_per_second": 0.52, "train/train_runtime": 134751.1179, "train/train_samples_per_second": 5.295, "train/train_steps_per_second": 0.165, "train/total_flos": 0.0, "train/train_loss": 1.8353804810692644} \ No newline at end of file