diff --git "a/wandb/run-20220504_095140-cwhobv6l/files/wandb-summary.json" "b/wandb/run-20220504_095140-cwhobv6l/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220504_095140-cwhobv6l/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 5.2025, "train/learning_rate": 0.0002960940198345447, "train/epoch": 0.03, "train/global_step": 170, "_runtime": 549, "_timestamp": 1651658449, "_step": 169, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 393.0, 558.0, 38.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.791566848754883, -12.933463096618652, -12.075359344482422, -11.217254638671875, -10.359150886535645, -9.501047134399414, -8.642942428588867, -7.784838676452637, -6.926734924316406, -6.068631172180176, -5.210526943206787, -4.352422714233398, -3.494318962097168, -2.6362152099609375, -1.7781109809875488, -0.9200067520141602, -0.06190299987792969, 0.7962009906768799, 1.6543049812316895, 2.512408971786499, 3.3705129623413086, 4.228616714477539, 5.086720943450928, 5.944825172424316, 6.802928924560547, 7.661032676696777, 8.519136428833008, 9.377241134643555, 10.235344886779785, 11.093448638916016, 11.951553344726562, 12.809657096862793, 13.66775894165039, 14.525862693786621, 15.383966445922852, 16.2420711517334, 17.100173950195312, 17.95827865600586, 18.816383361816406, 19.674488067626953, 20.532590866088867, 21.390695571899414, 22.248798370361328, 23.106903076171875, 23.965007781982422, 24.823110580444336, 25.681215286254883, 26.539318084716797, 27.397422790527344, 28.25552749633789, 29.113630294799805, 29.97173500061035, 30.829837799072266, 31.687942504882812, 32.54604721069336, 33.404151916503906, 34.26225280761719, 35.120357513427734, 35.97846221923828, 36.83656311035156, 37.69466781616211, 38.552772521972656, 39.4108772277832, 40.26898193359375, 41.1270866394043]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 9.0, 21.0, 24.0, 29.0, 50.0, 66.0, 70.0, 102.0, 104.0, 90.0, 88.0, 87.0, 70.0, 53.0, 39.0, 36.0, 23.0, 19.0, 9.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.638748168945312, -10.282394409179688, -9.926039695739746, -9.569684982299805, -9.21333122253418, -8.856977462768555, -8.500622749328613, -8.144268035888672, -7.787914276123047, -7.431560039520264, -7.0752058029174805, -6.718851566314697, -6.362497329711914, -6.006143093109131, -5.649788856506348, -5.2934346199035645, -4.937080383300781, -4.580726146697998, -4.224371910095215, -3.8680176734924316, -3.5116634368896484, -3.1553092002868652, -2.798954963684082, -2.442600727081299, -2.0862464904785156, -1.7298922538757324, -1.3735380172729492, -1.017183780670166, -0.6608295440673828, -0.3044753074645996, 0.051878929138183594, 0.4082331657409668, 0.76458740234375, 1.1209416389465332, 1.4772958755493164, 1.8336501121520996, 2.190004348754883, 2.546358585357666, 2.902712821960449, 3.2590670585632324, 3.6154212951660156, 3.971775531768799, 4.328129768371582, 4.684484004974365, 5.040838241577148, 5.397192478179932, 5.753546714782715, 6.109900951385498, 6.466255187988281, 6.8226094245910645, 7.178963661193848, 7.535317897796631, 7.891672134399414, 8.248025894165039, 8.60438060760498, 8.960735321044922, 9.317089080810547, 9.673442840576172, 10.029797554016113, 10.386152267456055, 10.74250602722168, 11.098859786987305, 11.455214500427246, 11.811569213867188, 12.167922973632812]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 10.0, 23.0, 43.0, 69.0, 351.0, 1606.0, 10019.0, 236859.0, 3344025.0, 585453.0, 13161.0, 1998.0, 441.0, 118.0, 37.0, 24.0, 10.0, 5.0, 3.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.78125, -12.318359375, -11.85546875, -11.392578125, -10.9296875, -10.466796875, -10.00390625, -9.541015625, -9.078125, -8.615234375, -8.15234375, -7.689453125, -7.2265625, -6.763671875, -6.30078125, -5.837890625, -5.375, -4.912109375, -4.44921875, -3.986328125, -3.5234375, -3.060546875, -2.59765625, -2.134765625, -1.671875, -1.208984375, -0.74609375, -0.283203125, 0.1796875, 0.642578125, 1.10546875, 1.568359375, 2.03125, 2.494140625, 2.95703125, 3.419921875, 3.8828125, 4.345703125, 4.80859375, 5.271484375, 5.734375, 6.197265625, 6.66015625, 7.123046875, 7.5859375, 8.048828125, 8.51171875, 8.974609375, 9.4375, 9.900390625, 10.36328125, 10.826171875, 11.2890625, 11.751953125, 12.21484375, 12.677734375, 13.140625, 13.603515625, 14.06640625, 14.529296875, 14.9921875, 15.455078125, 15.91796875, 16.380859375, 16.84375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 6.0, 12.0, 10.0, 20.0, 27.0, 26.0, 33.0, 48.0, 46.0, 49.0, 61.0, 76.0, 73.0, 53.0, 71.0, 66.0, 60.0, 57.0, 46.0, 41.0, 30.0, 27.0, 20.0, 11.0, 11.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0078125, -7.76068115234375, -7.5135498046875, -7.26641845703125, -7.019287109375, -6.77215576171875, -6.5250244140625, -6.27789306640625, -6.03076171875, -5.78363037109375, -5.5364990234375, -5.28936767578125, -5.042236328125, -4.79510498046875, -4.5479736328125, -4.30084228515625, -4.0537109375, -3.80657958984375, -3.5594482421875, -3.31231689453125, -3.065185546875, -2.81805419921875, -2.5709228515625, -2.32379150390625, -2.07666015625, -1.82952880859375, -1.5823974609375, -1.33526611328125, -1.088134765625, -0.84100341796875, -0.5938720703125, -0.34674072265625, -0.099609375, 0.14752197265625, 0.3946533203125, 0.64178466796875, 0.888916015625, 1.13604736328125, 1.3831787109375, 1.63031005859375, 1.87744140625, 2.12457275390625, 2.3717041015625, 2.61883544921875, 2.865966796875, 3.11309814453125, 3.3602294921875, 3.60736083984375, 3.8544921875, 4.10162353515625, 4.3487548828125, 4.59588623046875, 4.843017578125, 5.09014892578125, 5.3372802734375, 5.58441162109375, 5.83154296875, 6.07867431640625, 6.3258056640625, 6.57293701171875, 6.820068359375, 7.06719970703125, 7.3143310546875, 7.56146240234375, 7.80859375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 17.0, 24.0, 60.0, 127.0, 389.0, 342557.0, 3850353.0, 486.0, 139.0, 52.0, 28.0, 15.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.875, -133.796875, -127.71875, -121.640625, -115.5625, -109.484375, -103.40625, -97.328125, -91.25, -85.171875, -79.09375, -73.015625, -66.9375, -60.859375, -54.78125, -48.703125, -42.625, -36.546875, -30.46875, -24.390625, -18.3125, -12.234375, -6.15625, -0.078125, 6.0, 12.078125, 18.15625, 24.234375, 30.3125, 36.390625, 42.46875, 48.546875, 54.625, 60.703125, 66.78125, 72.859375, 78.9375, 85.015625, 91.09375, 97.171875, 103.25, 109.328125, 115.40625, 121.484375, 127.5625, 133.640625, 139.71875, 145.796875, 151.875, 157.953125, 164.03125, 170.109375, 176.1875, 182.265625, 188.34375, 194.421875, 200.5, 206.578125, 212.65625, 218.734375, 224.8125, 230.890625, 236.96875, 243.046875, 249.125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 13.0, 16.0, 31.0, 79.0, 167.0, 461.0, 1477.0, 1221.0, 351.0, 125.0, 56.0, 26.0, 19.0, 7.0, 10.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.840545654296875, -2.71038818359375, -2.580230712890625, -2.4500732421875, -2.319915771484375, -2.18975830078125, -2.059600830078125, -1.929443359375, -1.799285888671875, -1.66912841796875, -1.538970947265625, -1.4088134765625, -1.278656005859375, -1.14849853515625, -1.018341064453125, -0.88818359375, -0.758026123046875, -0.62786865234375, -0.497711181640625, -0.3675537109375, -0.237396240234375, -0.10723876953125, 0.022918701171875, 0.153076171875, 0.283233642578125, 0.41339111328125, 0.543548583984375, 0.6737060546875, 0.803863525390625, 0.93402099609375, 1.064178466796875, 1.1943359375, 1.324493408203125, 1.45465087890625, 1.584808349609375, 1.7149658203125, 1.845123291015625, 1.97528076171875, 2.105438232421875, 2.235595703125, 2.365753173828125, 2.49591064453125, 2.626068115234375, 2.7562255859375, 2.886383056640625, 3.01654052734375, 3.146697998046875, 3.27685546875, 3.407012939453125, 3.53717041015625, 3.667327880859375, 3.7974853515625, 3.927642822265625, 4.05780029296875, 4.187957763671875, 4.318115234375, 4.448272705078125, 4.57843017578125, 4.708587646484375, 4.8387451171875, 4.968902587890625, 5.09906005859375, 5.229217529296875, 5.359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 9.0, 9.0, 24.0, 50.0, 94.0, 181.0, 257.0, 172.0, 119.0, 51.0, 26.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.08782386779785, -19.582401275634766, -19.07697868347168, -18.571556091308594, -18.066133499145508, -17.560710906982422, -17.055288314819336, -16.54986572265625, -16.044443130493164, -15.539020538330078, -15.033597946166992, -14.528175354003906, -14.02275276184082, -13.517330169677734, -13.011907577514648, -12.506484985351562, -12.001062393188477, -11.49563980102539, -10.990217208862305, -10.484794616699219, -9.979372024536133, -9.473949432373047, -8.968526840209961, -8.463104248046875, -7.957681655883789, -7.452259063720703, -6.946836471557617, -6.441413879394531, -5.935991287231445, -5.430568695068359, -4.925146102905273, -4.4197235107421875, -3.9142990112304688, -3.408876419067383, -2.903453826904297, -2.398031234741211, -1.892608642578125, -1.387186050415039, -0.8817634582519531, -0.3763408660888672, 0.12908172607421875, 0.6345043182373047, 1.1399269104003906, 1.6453495025634766, 2.1507720947265625, 2.6561946868896484, 3.1616172790527344, 3.6670398712158203, 4.172462463378906, 4.677885055541992, 5.183307647705078, 5.688730239868164, 6.19415283203125, 6.699575424194336, 7.204998016357422, 7.710420608520508, 8.215843200683594, 8.72126579284668, 9.226688385009766, 9.732110977172852, 10.237533569335938, 10.742956161499023, 11.24837875366211, 11.753801345825195, 12.259223937988281]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 7.0, 20.0, 24.0, 26.0, 34.0, 37.0, 62.0, 63.0, 68.0, 63.0, 74.0, 85.0, 81.0, 66.0, 54.0, 53.0, 44.0, 27.0, 27.0, 32.0, 13.0, 12.0, 5.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.967407703399658, -6.700961112976074, -6.434514045715332, -6.168067455291748, -5.901620864868164, -5.635173797607422, -5.368727207183838, -5.102280616760254, -4.835833549499512, -4.569386959075928, -4.3029398918151855, -4.036493301391602, -3.7700467109680176, -3.5035998821258545, -3.2371530532836914, -2.9707064628601074, -2.7042598724365234, -2.4378130435943604, -2.1713664531707764, -1.9049196243286133, -1.6384729146957397, -1.3720262050628662, -1.1055793762207031, -0.8391326665878296, -0.572685956954956, -0.30623921751976013, -0.03979247808456421, 0.2266542911529541, 0.49310100078582764, 0.7595477104187012, 1.0259945392608643, 1.2924412488937378, 1.5588884353637695, 1.825335144996643, 2.0917818546295166, 2.3582286834716797, 2.6246752738952637, 2.8911221027374268, 3.15756893157959, 3.424015522003174, 3.690462350845337, 3.9569091796875, 4.223355770111084, 4.489802360534668, 4.75624942779541, 5.022696018218994, 5.289142608642578, 5.55558967590332, 5.822036266326904, 6.088482856750488, 6.3549299240112305, 6.6213765144348145, 6.887823104858398, 7.154270172119141, 7.420716762542725, 7.687163352966309, 7.953610420227051, 8.220057487487793, 8.486503601074219, 8.752950668334961, 9.019397735595703, 9.285843849182129, 9.552290916442871, 9.818737983703613, 10.085184097290039]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 9.0, 12.0, 17.0, 28.0, 25.0, 59.0, 100.0, 177.0, 251.0, 504.0, 1074.0, 2441.0, 7769.0, 48887.0, 721345.0, 236647.0, 21258.0, 4438.0, 1685.0, 814.0, 425.0, 206.0, 144.0, 82.0, 45.0, 20.0, 19.0, 7.0, 11.0, 3.0, 5.0, 4.0, 8.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.9296875, -2.845489501953125, -2.76129150390625, -2.677093505859375, -2.5928955078125, -2.508697509765625, -2.42449951171875, -2.340301513671875, -2.256103515625, -2.171905517578125, -2.08770751953125, -2.003509521484375, -1.9193115234375, -1.835113525390625, -1.75091552734375, -1.666717529296875, -1.58251953125, -1.498321533203125, -1.41412353515625, -1.329925537109375, -1.2457275390625, -1.161529541015625, -1.07733154296875, -0.993133544921875, -0.908935546875, -0.824737548828125, -0.74053955078125, -0.656341552734375, -0.5721435546875, -0.487945556640625, -0.40374755859375, -0.319549560546875, -0.2353515625, -0.151153564453125, -0.06695556640625, 0.017242431640625, 0.1014404296875, 0.185638427734375, 0.26983642578125, 0.354034423828125, 0.438232421875, 0.522430419921875, 0.60662841796875, 0.690826416015625, 0.7750244140625, 0.859222412109375, 0.94342041015625, 1.027618408203125, 1.11181640625, 1.196014404296875, 1.28021240234375, 1.364410400390625, 1.4486083984375, 1.532806396484375, 1.61700439453125, 1.701202392578125, 1.785400390625, 1.869598388671875, 1.95379638671875, 2.037994384765625, 2.1221923828125, 2.206390380859375, 2.29058837890625, 2.374786376953125, 2.458984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 11.0, 13.0, 16.0, 26.0, 47.0, 59.0, 69.0, 91.0, 86.0, 86.0, 94.0, 105.0, 79.0, 55.0, 49.0, 36.0, 29.0, 17.0, 15.0, 13.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1484375, -7.868408203125, -7.58837890625, -7.308349609375, -7.0283203125, -6.748291015625, -6.46826171875, -6.188232421875, -5.908203125, -5.628173828125, -5.34814453125, -5.068115234375, -4.7880859375, -4.508056640625, -4.22802734375, -3.947998046875, -3.66796875, -3.387939453125, -3.10791015625, -2.827880859375, -2.5478515625, -2.267822265625, -1.98779296875, -1.707763671875, -1.427734375, -1.147705078125, -0.86767578125, -0.587646484375, -0.3076171875, -0.027587890625, 0.25244140625, 0.532470703125, 0.8125, 1.092529296875, 1.37255859375, 1.652587890625, 1.9326171875, 2.212646484375, 2.49267578125, 2.772705078125, 3.052734375, 3.332763671875, 3.61279296875, 3.892822265625, 4.1728515625, 4.452880859375, 4.73291015625, 5.012939453125, 5.29296875, 5.572998046875, 5.85302734375, 6.133056640625, 6.4130859375, 6.693115234375, 6.97314453125, 7.253173828125, 7.533203125, 7.813232421875, 8.09326171875, 8.373291015625, 8.6533203125, 8.933349609375, 9.21337890625, 9.493408203125, 9.7734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 3.0, 5.0, 14.0, 7.0, 22.0, 39.0, 37.0, 82.0, 116.0, 152.0, 227.0, 347.0, 539.0, 877.0, 1483.0, 2270.0, 3902.0, 6496.0, 11087.0, 19407.0, 35271.0, 68247.0, 142150.0, 286583.0, 236345.0, 108908.0, 54435.0, 29310.0, 16485.0, 9265.0, 5630.0, 3363.0, 2004.0, 1295.0, 804.0, 463.0, 296.0, 170.0, 142.0, 73.0, 60.0, 39.0, 25.0, 28.0, 11.0, 11.0, 9.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.48291015625, -0.46863555908203125, -0.4543609619140625, -0.44008636474609375, -0.425811767578125, -0.41153717041015625, -0.3972625732421875, -0.38298797607421875, -0.36871337890625, -0.35443878173828125, -0.3401641845703125, -0.32588958740234375, -0.311614990234375, -0.29734039306640625, -0.2830657958984375, -0.26879119873046875, -0.2545166015625, -0.24024200439453125, -0.2259674072265625, -0.21169281005859375, -0.197418212890625, -0.18314361572265625, -0.1688690185546875, -0.15459442138671875, -0.14031982421875, -0.12604522705078125, -0.1117706298828125, -0.09749603271484375, -0.083221435546875, -0.06894683837890625, -0.0546722412109375, -0.04039764404296875, -0.026123046875, -0.01184844970703125, 0.0024261474609375, 0.01670074462890625, 0.030975341796875, 0.04524993896484375, 0.0595245361328125, 0.07379913330078125, 0.08807373046875, 0.10234832763671875, 0.1166229248046875, 0.13089752197265625, 0.145172119140625, 0.15944671630859375, 0.1737213134765625, 0.18799591064453125, 0.2022705078125, 0.21654510498046875, 0.2308197021484375, 0.24509429931640625, 0.259368896484375, 0.27364349365234375, 0.2879180908203125, 0.30219268798828125, 0.31646728515625, 0.33074188232421875, 0.3450164794921875, 0.35929107666015625, 0.373565673828125, 0.38784027099609375, 0.4021148681640625, 0.41638946533203125, 0.4306640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 9.0, 5.0, 5.0, 4.0, 8.0, 14.0, 12.0, 11.0, 24.0, 21.0, 18.0, 29.0, 21.0, 29.0, 27.0, 19.0, 34.0, 31.0, 41.0, 30.0, 33.0, 41.0, 39.0, 34.0, 32.0, 40.0, 32.0, 46.0, 24.0, 29.0, 28.0, 36.0, 31.0, 22.0, 17.0, 19.0, 18.0, 17.0, 13.0, 14.0, 9.0, 11.0, 6.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.31463623046875, -7.0863037109375, -6.85797119140625, -6.629638671875, -6.40130615234375, -6.1729736328125, -5.94464111328125, -5.71630859375, -5.48797607421875, -5.2596435546875, -5.03131103515625, -4.802978515625, -4.57464599609375, -4.3463134765625, -4.11798095703125, -3.8896484375, -3.66131591796875, -3.4329833984375, -3.20465087890625, -2.976318359375, -2.74798583984375, -2.5196533203125, -2.29132080078125, -2.06298828125, -1.83465576171875, -1.6063232421875, -1.37799072265625, -1.149658203125, -0.92132568359375, -0.6929931640625, -0.46466064453125, -0.236328125, -0.00799560546875, 0.2203369140625, 0.44866943359375, 0.677001953125, 0.90533447265625, 1.1336669921875, 1.36199951171875, 1.59033203125, 1.81866455078125, 2.0469970703125, 2.27532958984375, 2.503662109375, 2.73199462890625, 2.9603271484375, 3.18865966796875, 3.4169921875, 3.64532470703125, 3.8736572265625, 4.10198974609375, 4.330322265625, 4.55865478515625, 4.7869873046875, 5.01531982421875, 5.24365234375, 5.47198486328125, 5.7003173828125, 5.92864990234375, 6.156982421875, 6.38531494140625, 6.6136474609375, 6.84197998046875, 7.0703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 5.0, 4.0, 8.0, 12.0, 16.0, 13.0, 31.0, 38.0, 62.0, 72.0, 102.0, 164.0, 271.0, 432.0, 797.0, 1365.0, 2631.0, 5701.0, 14216.0, 46953.0, 292614.0, 564945.0, 81464.0, 21250.0, 7918.0, 3582.0, 1659.0, 898.0, 521.0, 266.0, 169.0, 116.0, 77.0, 48.0, 33.0, 20.0, 23.0, 11.0, 9.0, 8.0, 5.0, 8.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.1029052734375, -0.09989452362060547, -0.09688377380371094, -0.0938730239868164, -0.09086227416992188, -0.08785152435302734, -0.08484077453613281, -0.08183002471923828, -0.07881927490234375, -0.07580852508544922, -0.07279777526855469, -0.06978702545166016, -0.06677627563476562, -0.0637655258178711, -0.06075477600097656, -0.05774402618408203, -0.0547332763671875, -0.05172252655029297, -0.04871177673339844, -0.045701026916503906, -0.042690277099609375, -0.039679527282714844, -0.03666877746582031, -0.03365802764892578, -0.03064727783203125, -0.02763652801513672, -0.024625778198242188, -0.021615028381347656, -0.018604278564453125, -0.015593528747558594, -0.012582778930664062, -0.009572029113769531, -0.006561279296875, -0.0035505294799804688, -0.0005397796630859375, 0.0024709701538085938, 0.005481719970703125, 0.008492469787597656, 0.011503219604492188, 0.014513969421386719, 0.01752471923828125, 0.02053546905517578, 0.023546218872070312, 0.026556968688964844, 0.029567718505859375, 0.032578468322753906, 0.03558921813964844, 0.03859996795654297, 0.0416107177734375, 0.04462146759033203, 0.04763221740722656, 0.050642967224121094, 0.053653717041015625, 0.056664466857910156, 0.05967521667480469, 0.06268596649169922, 0.06569671630859375, 0.06870746612548828, 0.07171821594238281, 0.07472896575927734, 0.07773971557617188, 0.0807504653930664, 0.08376121520996094, 0.08677196502685547, 0.08978271484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 7.0, 8.0, 8.0, 12.0, 16.0, 27.0, 24.0, 43.0, 66.0, 66.0, 106.0, 89.0, 122.0, 79.0, 81.0, 68.0, 41.0, 35.0, 22.0, 14.0, 11.0, 12.0, 11.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.124113082885742e-05, -7.878616452217102e-05, -7.633119821548462e-05, -7.387623190879822e-05, -7.142126560211182e-05, -6.896629929542542e-05, -6.651133298873901e-05, -6.405636668205261e-05, -6.160140037536621e-05, -5.914643406867981e-05, -5.669146776199341e-05, -5.423650145530701e-05, -5.1781535148620605e-05, -4.9326568841934204e-05, -4.68716025352478e-05, -4.44166362285614e-05, -4.1961669921875e-05, -3.95067036151886e-05, -3.70517373085022e-05, -3.4596771001815796e-05, -3.2141804695129395e-05, -2.9686838388442993e-05, -2.7231872081756592e-05, -2.477690577507019e-05, -2.232193946838379e-05, -1.9866973161697388e-05, -1.7412006855010986e-05, -1.4957040548324585e-05, -1.2502074241638184e-05, -1.0047107934951782e-05, -7.592141628265381e-06, -5.1371753215789795e-06, -2.682209014892578e-06, -2.2724270820617676e-07, 2.2277235984802246e-06, 4.682689905166626e-06, 7.137656211853027e-06, 9.592622518539429e-06, 1.204758882522583e-05, 1.4502555131912231e-05, 1.6957521438598633e-05, 1.9412487745285034e-05, 2.1867454051971436e-05, 2.4322420358657837e-05, 2.6777386665344238e-05, 2.923235297203064e-05, 3.168731927871704e-05, 3.414228558540344e-05, 3.6597251892089844e-05, 3.9052218198776245e-05, 4.1507184505462646e-05, 4.396215081214905e-05, 4.641711711883545e-05, 4.887208342552185e-05, 5.132704973220825e-05, 5.378201603889465e-05, 5.6236982345581055e-05, 5.8691948652267456e-05, 6.114691495895386e-05, 6.360188126564026e-05, 6.605684757232666e-05, 6.851181387901306e-05, 7.096678018569946e-05, 7.342174649238586e-05, 7.587671279907227e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 4.0, 11.0, 14.0, 12.0, 17.0, 20.0, 32.0, 43.0, 48.0, 76.0, 107.0, 218.0, 2458.0, 733686.0, 309461.0, 1683.0, 189.0, 111.0, 84.0, 55.0, 41.0, 35.0, 27.0, 17.0, 13.0, 13.0, 8.0, 8.0, 8.0, 7.0, 4.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.50439453125, -0.48860931396484375, -0.4728240966796875, -0.45703887939453125, -0.441253662109375, -0.42546844482421875, -0.4096832275390625, -0.39389801025390625, -0.37811279296875, -0.36232757568359375, -0.3465423583984375, -0.33075714111328125, -0.314971923828125, -0.29918670654296875, -0.2834014892578125, -0.26761627197265625, -0.2518310546875, -0.23604583740234375, -0.2202606201171875, -0.20447540283203125, -0.188690185546875, -0.17290496826171875, -0.1571197509765625, -0.14133453369140625, -0.12554931640625, -0.10976409912109375, -0.0939788818359375, -0.07819366455078125, -0.062408447265625, -0.04662322998046875, -0.0308380126953125, -0.01505279541015625, 0.000732421875, 0.01651763916015625, 0.0323028564453125, 0.04808807373046875, 0.063873291015625, 0.07965850830078125, 0.0954437255859375, 0.11122894287109375, 0.12701416015625, 0.14279937744140625, 0.1585845947265625, 0.17436981201171875, 0.190155029296875, 0.20594024658203125, 0.2217254638671875, 0.23751068115234375, 0.2532958984375, 0.26908111572265625, 0.2848663330078125, 0.30065155029296875, 0.316436767578125, 0.33222198486328125, 0.3480072021484375, 0.36379241943359375, 0.37957763671875, 0.39536285400390625, 0.4111480712890625, 0.42693328857421875, 0.442718505859375, 0.45850372314453125, 0.4742889404296875, 0.49007415771484375, 0.505859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 1.0, 5.0, 5.0, 10.0, 9.0, 9.0, 12.0, 12.0, 19.0, 26.0, 37.0, 44.0, 42.0, 52.0, 73.0, 110.0, 107.0, 78.0, 58.0, 56.0, 36.0, 38.0, 33.0, 31.0, 21.0, 12.0, 7.0, 8.0, 4.0, 9.0, 5.0, 4.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03619384765625, -0.034952640533447266, -0.03371143341064453, -0.0324702262878418, -0.031229019165039062, -0.029987812042236328, -0.028746604919433594, -0.02750539779663086, -0.026264190673828125, -0.02502298355102539, -0.023781776428222656, -0.022540569305419922, -0.021299362182617188, -0.020058155059814453, -0.01881694793701172, -0.017575740814208984, -0.01633453369140625, -0.015093326568603516, -0.013852119445800781, -0.012610912322998047, -0.011369705200195312, -0.010128498077392578, -0.008887290954589844, -0.007646083831787109, -0.006404876708984375, -0.005163669586181641, -0.003922462463378906, -0.002681255340576172, -0.0014400482177734375, -0.00019884109497070312, 0.0010423660278320312, 0.0022835731506347656, 0.0035247802734375, 0.004765987396240234, 0.006007194519042969, 0.007248401641845703, 0.008489608764648438, 0.009730815887451172, 0.010972023010253906, 0.01221323013305664, 0.013454437255859375, 0.01469564437866211, 0.015936851501464844, 0.017178058624267578, 0.018419265747070312, 0.019660472869873047, 0.02090167999267578, 0.022142887115478516, 0.02338409423828125, 0.024625301361083984, 0.02586650848388672, 0.027107715606689453, 0.028348922729492188, 0.029590129852294922, 0.030831336975097656, 0.03207254409790039, 0.033313751220703125, 0.03455495834350586, 0.035796165466308594, 0.03703737258911133, 0.03827857971191406, 0.0395197868347168, 0.04076099395751953, 0.042002201080322266, 0.043243408203125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 83.0, 650.0, 251.0, 20.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.49177360534668, -20.032306671142578, -18.572837829589844, -17.113370895385742, -15.65390396118164, -14.194437026977539, -12.734969139099121, -11.275501251220703, -9.816034317016602, -8.3565673828125, -6.897099494934082, -5.437632083892822, -3.9781646728515625, -2.5186972618103027, -1.059229850769043, 0.400238037109375, 1.8597049713134766, 3.3191723823547363, 4.778639793395996, 6.238107204437256, 7.697574615478516, 9.157041549682617, 10.616509437561035, 12.075977325439453, 13.535444259643555, 14.994911193847656, 16.45438003540039, 17.913846969604492, 19.373313903808594, 20.832780838012695, 22.292247772216797, 23.75171661376953, 25.211181640625, 26.6706485748291, 28.130115509033203, 29.589584350585938, 31.04905128479004, 32.50851821899414, 33.967987060546875, 35.427452087402344, 36.88692092895508, 38.34638977050781, 39.80585479736328, 41.265323638916016, 42.72479248046875, 44.18425750732422, 45.64372634887695, 47.10319519042969, 48.562660217285156, 50.02212905883789, 51.48159408569336, 52.941062927246094, 54.40052795410156, 55.8599967956543, 57.31946563720703, 58.7789306640625, 60.238399505615234, 61.69786834716797, 63.15733337402344, 64.6167984008789, 66.0762710571289, 67.53573608398438, 68.99520111083984, 70.45467376708984, 71.91413879394531]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 16.0, 15.0, 20.0, 27.0, 37.0, 57.0, 57.0, 83.0, 72.0, 81.0, 92.0, 98.0, 77.0, 54.0, 59.0, 35.0, 32.0, 26.0, 22.0, 16.0, 8.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.395238876342773, -7.159341335296631, -6.923443794250488, -6.687546730041504, -6.451649188995361, -6.215751647949219, -5.979854583740234, -5.743957042694092, -5.508059501647949, -5.272161960601807, -5.036264419555664, -4.80036735534668, -4.564469814300537, -4.3285722732543945, -4.09267520904541, -3.8567776679992676, -3.620880126953125, -3.3849825859069824, -3.149085283279419, -2.9131879806518555, -2.677290439605713, -2.4413928985595703, -2.205495595932007, -1.9695981740951538, -1.7337007522583008, -1.4978033304214478, -1.2619059085845947, -1.0260084867477417, -0.7901110649108887, -0.5542136430740356, -0.3183162212371826, -0.08241879940032959, 0.15347909927368164, 0.38937652111053467, 0.6252739429473877, 0.8611713647842407, 1.0970687866210938, 1.3329662084579468, 1.5688636302947998, 1.8047610521316528, 2.040658473968506, 2.2765560150146484, 2.512453317642212, 2.7483506202697754, 2.984248161315918, 3.2201457023620605, 3.456043004989624, 3.6919403076171875, 3.92783784866333, 4.163735389709473, 4.399632453918457, 4.6355299949646, 4.871427536010742, 5.107325077056885, 5.343222618103027, 5.579119682312012, 5.815017223358154, 6.050914764404297, 6.286811828613281, 6.522709369659424, 6.758606910705566, 6.994504451751709, 7.230401992797852, 7.466299057006836, 7.7021965980529785]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 7.0, 9.0, 12.0, 10.0, 10.0, 20.0, 24.0, 39.0, 75.0, 102.0, 151.0, 247.0, 429.0, 958.0, 2526.0, 9509.0, 94334.0, 870493.0, 58399.0, 7244.0, 2076.0, 796.0, 406.0, 216.0, 150.0, 108.0, 54.0, 32.0, 34.0, 23.0, 11.0, 6.0, 10.0, 7.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.615234375, -10.27734375, -9.939453125, -9.6015625, -9.263671875, -8.92578125, -8.587890625, -8.25, -7.912109375, -7.57421875, -7.236328125, -6.8984375, -6.560546875, -6.22265625, -5.884765625, -5.546875, -5.208984375, -4.87109375, -4.533203125, -4.1953125, -3.857421875, -3.51953125, -3.181640625, -2.84375, -2.505859375, -2.16796875, -1.830078125, -1.4921875, -1.154296875, -0.81640625, -0.478515625, -0.140625, 0.197265625, 0.53515625, 0.873046875, 1.2109375, 1.548828125, 1.88671875, 2.224609375, 2.5625, 2.900390625, 3.23828125, 3.576171875, 3.9140625, 4.251953125, 4.58984375, 4.927734375, 5.265625, 5.603515625, 5.94140625, 6.279296875, 6.6171875, 6.955078125, 7.29296875, 7.630859375, 7.96875, 8.306640625, 8.64453125, 8.982421875, 9.3203125, 9.658203125, 9.99609375, 10.333984375, 10.671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 7.0, 15.0, 26.0, 46.0, 78.0, 153.0, 156.0, 174.0, 134.0, 90.0, 62.0, 32.0, 17.0, 9.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-143.25, -138.650390625, -134.05078125, -129.451171875, -124.8515625, -120.251953125, -115.65234375, -111.052734375, -106.453125, -101.853515625, -97.25390625, -92.654296875, -88.0546875, -83.455078125, -78.85546875, -74.255859375, -69.65625, -65.056640625, -60.45703125, -55.857421875, -51.2578125, -46.658203125, -42.05859375, -37.458984375, -32.859375, -28.259765625, -23.66015625, -19.060546875, -14.4609375, -9.861328125, -5.26171875, -0.662109375, 3.9375, 8.537109375, 13.13671875, 17.736328125, 22.3359375, 26.935546875, 31.53515625, 36.134765625, 40.734375, 45.333984375, 49.93359375, 54.533203125, 59.1328125, 63.732421875, 68.33203125, 72.931640625, 77.53125, 82.130859375, 86.73046875, 91.330078125, 95.9296875, 100.529296875, 105.12890625, 109.728515625, 114.328125, 118.927734375, 123.52734375, 128.126953125, 132.7265625, 137.326171875, 141.92578125, 146.525390625, 151.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 10.0, 17.0, 22.0, 23.0, 49.0, 82.0, 124.0, 247.0, 528.0, 5342.0, 1038126.0, 2960.0, 456.0, 216.0, 123.0, 81.0, 52.0, 26.0, 16.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.3125, -48.65869140625, -47.0048828125, -45.35107421875, -43.697265625, -42.04345703125, -40.3896484375, -38.73583984375, -37.08203125, -35.42822265625, -33.7744140625, -32.12060546875, -30.466796875, -28.81298828125, -27.1591796875, -25.50537109375, -23.8515625, -22.19775390625, -20.5439453125, -18.89013671875, -17.236328125, -15.58251953125, -13.9287109375, -12.27490234375, -10.62109375, -8.96728515625, -7.3134765625, -5.65966796875, -4.005859375, -2.35205078125, -0.6982421875, 0.95556640625, 2.609375, 4.26318359375, 5.9169921875, 7.57080078125, 9.224609375, 10.87841796875, 12.5322265625, 14.18603515625, 15.83984375, 17.49365234375, 19.1474609375, 20.80126953125, 22.455078125, 24.10888671875, 25.7626953125, 27.41650390625, 29.0703125, 30.72412109375, 32.3779296875, 34.03173828125, 35.685546875, 37.33935546875, 38.9931640625, 40.64697265625, 42.30078125, 43.95458984375, 45.6083984375, 47.26220703125, 48.916015625, 50.56982421875, 52.2236328125, 53.87744140625, 55.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 9.0, 11.0, 27.0, 39.0, 57.0, 80.0, 107.0, 113.0, 138.0, 118.0, 84.0, 64.0, 45.0, 39.0, 21.0, 15.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-121.25, -117.23828125, -113.2265625, -109.21484375, -105.203125, -101.19140625, -97.1796875, -93.16796875, -89.15625, -85.14453125, -81.1328125, -77.12109375, -73.109375, -69.09765625, -65.0859375, -61.07421875, -57.0625, -53.05078125, -49.0390625, -45.02734375, -41.015625, -37.00390625, -32.9921875, -28.98046875, -24.96875, -20.95703125, -16.9453125, -12.93359375, -8.921875, -4.91015625, -0.8984375, 3.11328125, 7.125, 11.13671875, 15.1484375, 19.16015625, 23.171875, 27.18359375, 31.1953125, 35.20703125, 39.21875, 43.23046875, 47.2421875, 51.25390625, 55.265625, 59.27734375, 63.2890625, 67.30078125, 71.3125, 75.32421875, 79.3359375, 83.34765625, 87.359375, 91.37109375, 95.3828125, 99.39453125, 103.40625, 107.41796875, 111.4296875, 115.44140625, 119.453125, 123.46484375, 127.4765625, 131.48828125, 135.5]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 10.0, 10.0, 17.0, 42.0, 65.0, 123.0, 294.0, 663.0, 1684.0, 4608.0, 24628.0, 998832.0, 12214.0, 3167.0, 1188.0, 504.0, 224.0, 107.0, 46.0, 24.0, 19.0, 14.0, 13.0, 6.0, 8.0, 0.0, 6.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.279296875, -1.2430877685546875, -1.206878662109375, -1.1706695556640625, -1.13446044921875, -1.0982513427734375, -1.062042236328125, -1.0258331298828125, -0.9896240234375, -0.9534149169921875, -0.917205810546875, -0.8809967041015625, -0.84478759765625, -0.8085784912109375, -0.772369384765625, -0.7361602783203125, -0.699951171875, -0.6637420654296875, -0.627532958984375, -0.5913238525390625, -0.55511474609375, -0.5189056396484375, -0.482696533203125, -0.4464874267578125, -0.4102783203125, -0.3740692138671875, -0.337860107421875, -0.3016510009765625, -0.26544189453125, -0.2292327880859375, -0.193023681640625, -0.1568145751953125, -0.12060546875, -0.0843963623046875, -0.048187255859375, -0.0119781494140625, 0.02423095703125, 0.0604400634765625, 0.096649169921875, 0.1328582763671875, 0.1690673828125, 0.2052764892578125, 0.241485595703125, 0.2776947021484375, 0.31390380859375, 0.3501129150390625, 0.386322021484375, 0.4225311279296875, 0.458740234375, 0.4949493408203125, 0.531158447265625, 0.5673675537109375, 0.60357666015625, 0.6397857666015625, 0.675994873046875, 0.7122039794921875, 0.7484130859375, 0.7846221923828125, 0.820831298828125, 0.8570404052734375, 0.89324951171875, 0.9294586181640625, 0.965667724609375, 1.0018768310546875, 1.0380859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 10.0, 13.0, 24.0, 29.0, 58.0, 221.0, 430.0, 123.0, 41.0, 24.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012683868408203125, -0.00012218765914440155, -0.00011753663420677185, -0.00011288560926914215, -0.00010823458433151245, -0.00010358355939388275, -9.893253445625305e-05, -9.428150951862335e-05, -8.963048458099365e-05, -8.497945964336395e-05, -8.032843470573425e-05, -7.567740976810455e-05, -7.102638483047485e-05, -6.637535989284515e-05, -6.172433495521545e-05, -5.7073310017585754e-05, -5.2422285079956055e-05, -4.7771260142326355e-05, -4.3120235204696655e-05, -3.8469210267066956e-05, -3.3818185329437256e-05, -2.9167160391807556e-05, -2.4516135454177856e-05, -1.9865110516548157e-05, -1.5214085578918457e-05, -1.0563060641288757e-05, -5.912035703659058e-06, -1.261010766029358e-06, 3.390014171600342e-06, 8.041039109230042e-06, 1.2692064046859741e-05, 1.734308898448944e-05, 2.199411392211914e-05, 2.664513885974884e-05, 3.129616379737854e-05, 3.594718873500824e-05, 4.059821367263794e-05, 4.524923861026764e-05, 4.990026354789734e-05, 5.455128848552704e-05, 5.920231342315674e-05, 6.385333836078644e-05, 6.850436329841614e-05, 7.315538823604584e-05, 7.780641317367554e-05, 8.245743811130524e-05, 8.710846304893494e-05, 9.175948798656464e-05, 9.641051292419434e-05, 0.00010106153786182404, 0.00010571256279945374, 0.00011036358773708344, 0.00011501461267471313, 0.00011966563761234283, 0.00012431666254997253, 0.00012896768748760223, 0.00013361871242523193, 0.00013826973736286163, 0.00014292076230049133, 0.00014757178723812103, 0.00015222281217575073, 0.00015687383711338043, 0.00016152486205101013, 0.00016617588698863983, 0.00017082691192626953]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 5.0, 7.0, 8.0, 23.0, 56.0, 173.0, 1071.0, 10882.0, 1028449.0, 6872.0, 769.0, 140.0, 47.0, 15.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9609375, -2.869598388671875, -2.77825927734375, -2.686920166015625, -2.5955810546875, -2.504241943359375, -2.41290283203125, -2.321563720703125, -2.230224609375, -2.138885498046875, -2.04754638671875, -1.956207275390625, -1.8648681640625, -1.773529052734375, -1.68218994140625, -1.590850830078125, -1.49951171875, -1.408172607421875, -1.31683349609375, -1.225494384765625, -1.1341552734375, -1.042816162109375, -0.95147705078125, -0.860137939453125, -0.768798828125, -0.677459716796875, -0.58612060546875, -0.494781494140625, -0.4034423828125, -0.312103271484375, -0.22076416015625, -0.129425048828125, -0.0380859375, 0.053253173828125, 0.14459228515625, 0.235931396484375, 0.3272705078125, 0.418609619140625, 0.50994873046875, 0.601287841796875, 0.692626953125, 0.783966064453125, 0.87530517578125, 0.966644287109375, 1.0579833984375, 1.149322509765625, 1.24066162109375, 1.332000732421875, 1.42333984375, 1.514678955078125, 1.60601806640625, 1.697357177734375, 1.7886962890625, 1.880035400390625, 1.97137451171875, 2.062713623046875, 2.154052734375, 2.245391845703125, 2.33673095703125, 2.428070068359375, 2.5194091796875, 2.610748291015625, 2.70208740234375, 2.793426513671875, 2.884765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 6.0, 4.0, 2.0, 5.0, 7.0, 9.0, 31.0, 461.0, 402.0, 40.0, 11.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.404296875, -0.3916587829589844, -0.37902069091796875, -0.3663825988769531, -0.3537445068359375, -0.3411064147949219, -0.32846832275390625, -0.3158302307128906, -0.303192138671875, -0.2905540466308594, -0.27791595458984375, -0.2652778625488281, -0.2526397705078125, -0.24000167846679688, -0.22736358642578125, -0.21472549438476562, -0.20208740234375, -0.18944931030273438, -0.17681121826171875, -0.16417312622070312, -0.1515350341796875, -0.13889694213867188, -0.12625885009765625, -0.11362075805664062, -0.100982666015625, -0.08834457397460938, -0.07570648193359375, -0.06306838989257812, -0.0504302978515625, -0.037792205810546875, -0.02515411376953125, -0.012516021728515625, 0.0001220703125, 0.012760162353515625, 0.02539825439453125, 0.038036346435546875, 0.0506744384765625, 0.06331253051757812, 0.07595062255859375, 0.08858871459960938, 0.101226806640625, 0.11386489868164062, 0.12650299072265625, 0.13914108276367188, 0.1517791748046875, 0.16441726684570312, 0.17705535888671875, 0.18969345092773438, 0.20233154296875, 0.21496963500976562, 0.22760772705078125, 0.24024581909179688, 0.2528839111328125, 0.2655220031738281, 0.27816009521484375, 0.2907981872558594, 0.303436279296875, 0.3160743713378906, 0.32871246337890625, 0.3413505554199219, 0.3539886474609375, 0.3666267395019531, 0.37926483154296875, 0.3919029235839844, 0.404541015625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.374441623687744, 15.287652969360352, 36.949745178222656, 58.611839294433594, 80.27393341064453, 101.93602752685547, 123.5981216430664, 145.26022338867188, 166.9223175048828, 188.58441162109375, 210.2465057373047, 231.90859985351562, 253.57069396972656, 275.2327880859375, 296.8948974609375, 318.5569763183594, 340.21905517578125, 361.88116455078125, 383.5432434082031, 405.205322265625, 426.867431640625, 448.529541015625, 470.1916198730469, 491.85369873046875, 513.5158081054688, 535.1779174804688, 556.8399658203125, 578.5020751953125, 600.1641845703125, 621.8262939453125, 643.4884033203125, 665.1504516601562, 686.8126220703125, 708.4747314453125, 730.1368408203125, 751.7988891601562, 773.4609985351562, 795.1231079101562, 816.78515625, 838.447265625, 860.109375, 881.771484375, 903.43359375, 925.0956420898438, 946.7577514648438, 968.4198608398438, 990.0819091796875, 1011.7440185546875, 1033.4061279296875, 1055.0682373046875, 1076.7303466796875, 1098.3924560546875, 1120.054443359375, 1141.716552734375, 1163.378662109375, 1185.040771484375, 1206.702880859375, 1228.364990234375, 1250.027099609375, 1271.689208984375, 1293.351318359375, 1315.0133056640625, 1336.6754150390625, 1358.3375244140625, 1379.9996337890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 18.0, 32.0, 45.0, 47.0, 40.0, 50.0, 69.0, 96.0, 75.0, 81.0, 99.0, 77.0, 58.0, 70.0, 52.0, 22.0, 16.0, 14.0, 12.0, 12.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.20059204101562, -131.21047973632812, -127.22036743164062, -123.23025512695312, -119.2401351928711, -115.2500228881836, -111.2599105834961, -107.2697982788086, -103.27967834472656, -99.28956604003906, -95.29945373535156, -91.30934143066406, -87.31922149658203, -83.32910919189453, -79.33899688720703, -75.34888458251953, -71.35877227783203, -67.36865997314453, -63.378543853759766, -59.388431549072266, -55.3983154296875, -51.408203125, -47.4180908203125, -43.427978515625, -39.437862396240234, -35.447750091552734, -31.45763397216797, -27.46752166748047, -23.477407455444336, -19.487293243408203, -15.497180938720703, -11.50706672668457, -7.5169525146484375, -3.526838779449463, 0.4632749557495117, 4.453388214111328, 8.443502426147461, 12.433616638183594, 16.423728942871094, 20.413843154907227, 24.40395736694336, 28.394071578979492, 32.384185791015625, 36.374298095703125, 40.364410400390625, 44.35452651977539, 48.34463882446289, 52.334754943847656, 56.324867248535156, 60.314979553222656, 64.30509185791016, 68.29521179199219, 72.28532409667969, 76.27543640136719, 80.26554870605469, 84.25566101074219, 88.24577331542969, 92.23588562011719, 96.22599792480469, 100.21611022949219, 104.20623016357422, 108.19634246826172, 112.18645477294922, 116.17656707763672, 120.16668701171875]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 27.0, 33.0, 60.0, 53.0, 80.0, 103.0, 2619.0, 4190490.0, 483.0, 104.0, 79.0, 64.0, 40.0, 13.0, 19.0, 10.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-85.125, -82.7177734375, -80.310546875, -77.9033203125, -75.49609375, -73.0888671875, -70.681640625, -68.2744140625, -65.8671875, -63.4599609375, -61.052734375, -58.6455078125, -56.23828125, -53.8310546875, -51.423828125, -49.0166015625, -46.609375, -44.2021484375, -41.794921875, -39.3876953125, -36.98046875, -34.5732421875, -32.166015625, -29.7587890625, -27.3515625, -24.9443359375, -22.537109375, -20.1298828125, -17.72265625, -15.3154296875, -12.908203125, -10.5009765625, -8.09375, -5.6865234375, -3.279296875, -0.8720703125, 1.53515625, 3.9423828125, 6.349609375, 8.7568359375, 11.1640625, 13.5712890625, 15.978515625, 18.3857421875, 20.79296875, 23.2001953125, 25.607421875, 28.0146484375, 30.421875, 32.8291015625, 35.236328125, 37.6435546875, 40.05078125, 42.4580078125, 44.865234375, 47.2724609375, 49.6796875, 52.0869140625, 54.494140625, 56.9013671875, 59.30859375, 61.7158203125, 64.123046875, 66.5302734375, 68.9375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 8.0, 5.0, 6.0, 12.0, 5.0, 8.0, 11.0, 12.0, 18.0, 18.0, 20.0, 29.0, 19.0, 27.0, 29.0, 37.0, 39.0, 46.0, 41.0, 41.0, 38.0, 33.0, 36.0, 50.0, 40.0, 37.0, 39.0, 34.0, 47.0, 35.0, 30.0, 26.0, 26.0, 25.0, 8.0, 14.0, 15.0, 10.0, 3.0, 9.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.91851806640625, -2.8135986328125, -2.70867919921875, -2.603759765625, -2.49884033203125, -2.3939208984375, -2.28900146484375, -2.18408203125, -2.07916259765625, -1.9742431640625, -1.86932373046875, -1.764404296875, -1.65948486328125, -1.5545654296875, -1.44964599609375, -1.3447265625, -1.23980712890625, -1.1348876953125, -1.02996826171875, -0.925048828125, -0.82012939453125, -0.7152099609375, -0.61029052734375, -0.50537109375, -0.40045166015625, -0.2955322265625, -0.19061279296875, -0.085693359375, 0.01922607421875, 0.1241455078125, 0.22906494140625, 0.333984375, 0.43890380859375, 0.5438232421875, 0.64874267578125, 0.753662109375, 0.85858154296875, 0.9635009765625, 1.06842041015625, 1.17333984375, 1.27825927734375, 1.3831787109375, 1.48809814453125, 1.593017578125, 1.69793701171875, 1.8028564453125, 1.90777587890625, 2.0126953125, 2.11761474609375, 2.2225341796875, 2.32745361328125, 2.432373046875, 2.53729248046875, 2.6422119140625, 2.74713134765625, 2.85205078125, 2.95697021484375, 3.0618896484375, 3.16680908203125, 3.271728515625, 3.37664794921875, 3.4815673828125, 3.58648681640625, 3.69140625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 14.0, 70.0, 4194054.0, 114.0, 18.0, 6.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-946.0, -925.25, -904.5, -883.75, -863.0, -842.25, -821.5, -800.75, -780.0, -759.25, -738.5, -717.75, -697.0, -676.25, -655.5, -634.75, -614.0, -593.25, -572.5, -551.75, -531.0, -510.25, -489.5, -468.75, -448.0, -427.25, -406.5, -385.75, -365.0, -344.25, -323.5, -302.75, -282.0, -261.25, -240.5, -219.75, -199.0, -178.25, -157.5, -136.75, -116.0, -95.25, -74.5, -53.75, -33.0, -12.25, 8.5, 29.25, 50.0, 70.75, 91.5, 112.25, 133.0, 153.75, 174.5, 195.25, 216.0, 236.75, 257.5, 278.25, 299.0, 319.75, 340.5, 361.25, 382.0]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 16.0, 22.0, 60.0, 162.0, 545.0, 1707.0, 1097.0, 303.0, 84.0, 33.0, 17.0, 10.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.4437255859375, -5.313232421875, -5.1827392578125, -5.05224609375, -4.9217529296875, -4.791259765625, -4.6607666015625, -4.5302734375, -4.3997802734375, -4.269287109375, -4.1387939453125, -4.00830078125, -3.8778076171875, -3.747314453125, -3.6168212890625, -3.486328125, -3.3558349609375, -3.225341796875, -3.0948486328125, -2.96435546875, -2.8338623046875, -2.703369140625, -2.5728759765625, -2.4423828125, -2.3118896484375, -2.181396484375, -2.0509033203125, -1.92041015625, -1.7899169921875, -1.659423828125, -1.5289306640625, -1.3984375, -1.2679443359375, -1.137451171875, -1.0069580078125, -0.87646484375, -0.7459716796875, -0.615478515625, -0.4849853515625, -0.3544921875, -0.2239990234375, -0.093505859375, 0.0369873046875, 0.16748046875, 0.2979736328125, 0.428466796875, 0.5589599609375, 0.689453125, 0.8199462890625, 0.950439453125, 1.0809326171875, 1.21142578125, 1.3419189453125, 1.472412109375, 1.6029052734375, 1.7333984375, 1.8638916015625, 1.994384765625, 2.1248779296875, 2.25537109375, 2.3858642578125, 2.516357421875, 2.6468505859375, 2.77734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 3.0, 4.0, 2.0, 14.0, 27.0, 36.0, 47.0, 75.0, 131.0, 144.0, 130.0, 126.0, 103.0, 55.0, 38.0, 27.0, 15.0, 11.0, 4.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.628470420837402, -4.360640048980713, -4.092809677124023, -3.824978828430176, -3.5571484565734863, -3.289318084716797, -3.0214874744415283, -2.7536568641662598, -2.4858264923095703, -2.217996120452881, -1.9501655101776123, -1.6823350191116333, -1.4145045280456543, -1.1466740369796753, -0.8788435459136963, -0.6110130548477173, -0.3431825637817383, -0.07535207271575928, 0.19247841835021973, 0.46030890941619873, 0.7281394004821777, 0.9959698915481567, 1.2638003826141357, 1.5316308736801147, 1.7994613647460938, 2.067291736602783, 2.3351223468780518, 2.6029529571533203, 2.8707833290100098, 3.138613700866699, 3.4064443111419678, 3.6742749214172363, 3.942105293273926, 4.209935665130615, 4.477766036987305, 4.745596885681152, 5.013427257537842, 5.281257629394531, 5.549088478088379, 5.816918849945068, 6.084749221801758, 6.352579593658447, 6.620409965515137, 6.888240814208984, 7.156071186065674, 7.423901557922363, 7.691732406616211, 7.9595627784729, 8.22739315032959, 8.495223999023438, 8.763053894042969, 9.030884742736816, 9.298715591430664, 9.566545486450195, 9.834376335144043, 10.102206230163574, 10.370037078857422, 10.63786792755127, 10.9056978225708, 11.173528671264648, 11.44135856628418, 11.709189414978027, 11.977020263671875, 12.244850158691406, 12.512681007385254]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 8.0, 7.0, 8.0, 8.0, 17.0, 12.0, 20.0, 27.0, 28.0, 29.0, 38.0, 43.0, 29.0, 40.0, 32.0, 34.0, 43.0, 42.0, 43.0, 44.0, 47.0, 51.0, 30.0, 30.0, 37.0, 31.0, 28.0, 21.0, 22.0, 21.0, 19.0, 14.0, 13.0, 13.0, 6.0, 10.0, 8.0, 2.0, 4.0, 6.0, 3.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.978426933288574, -3.869804620742798, -3.7611820697784424, -3.652559757232666, -3.5439372062683105, -3.435314893722534, -3.326692581176758, -3.2180700302124023, -3.109447717666626, -3.0008254051208496, -2.892202854156494, -2.7835805416107178, -2.6749582290649414, -2.566335678100586, -2.4577133655548096, -2.349091053009033, -2.2404685020446777, -2.1318461894989014, -2.023223638534546, -1.9146013259887695, -1.8059788942337036, -1.6973564624786377, -1.5887341499328613, -1.4801117181777954, -1.3714892864227295, -1.2628668546676636, -1.1542444229125977, -1.0456221103668213, -0.9369996786117554, -0.8283772468566895, -0.7197548747062683, -0.6111325025558472, -0.5025098323822021, -0.3938874304294586, -0.2852650284767151, -0.17664262652397156, -0.06802022457122803, 0.04060220718383789, 0.14922457933425903, 0.2578469514846802, 0.3664693832397461, 0.4750917851924896, 0.5837141871452332, 0.6923365592956543, 0.8009589910507202, 0.9095814228057861, 1.0182037353515625, 1.1268261671066284, 1.2354485988616943, 1.3440710306167603, 1.4526934623718262, 1.5613157749176025, 1.6699382066726685, 1.7785606384277344, 1.8871829509735107, 1.9958053827285767, 2.1044278144836426, 2.213050127029419, 2.3216726779937744, 2.430294990539551, 2.5389175415039062, 2.6475398540496826, 2.756162166595459, 2.8647847175598145, 2.973407030105591]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 14.0, 7.0, 10.0, 21.0, 25.0, 25.0, 23.0, 64.0, 84.0, 101.0, 129.0, 211.0, 274.0, 372.0, 530.0, 721.0, 1111.0, 1752.0, 3131.0, 6897.0, 20440.0, 93225.0, 617696.0, 241023.0, 38645.0, 10897.0, 4448.0, 2246.0, 1348.0, 883.0, 584.0, 464.0, 306.0, 222.0, 180.0, 109.0, 100.0, 61.0, 48.0, 34.0, 28.0, 22.0, 12.0, 7.0, 7.0, 6.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90576171875, -0.8780899047851562, -0.8504180908203125, -0.8227462768554688, -0.795074462890625, -0.7674026489257812, -0.7397308349609375, -0.7120590209960938, -0.68438720703125, -0.6567153930664062, -0.6290435791015625, -0.6013717651367188, -0.573699951171875, -0.5460281372070312, -0.5183563232421875, -0.49068450927734375, -0.4630126953125, -0.43534088134765625, -0.4076690673828125, -0.37999725341796875, -0.352325439453125, -0.32465362548828125, -0.2969818115234375, -0.26930999755859375, -0.24163818359375, -0.21396636962890625, -0.1862945556640625, -0.15862274169921875, -0.130950927734375, -0.10327911376953125, -0.0756072998046875, -0.04793548583984375, -0.020263671875, 0.00740814208984375, 0.0350799560546875, 0.06275177001953125, 0.090423583984375, 0.11809539794921875, 0.1457672119140625, 0.17343902587890625, 0.20111083984375, 0.22878265380859375, 0.2564544677734375, 0.28412628173828125, 0.311798095703125, 0.33946990966796875, 0.3671417236328125, 0.39481353759765625, 0.4224853515625, 0.45015716552734375, 0.4778289794921875, 0.5055007934570312, 0.533172607421875, 0.5608444213867188, 0.5885162353515625, 0.6161880493164062, 0.64385986328125, 0.6715316772460938, 0.6992034912109375, 0.7268753051757812, 0.754547119140625, 0.7822189331054688, 0.8098907470703125, 0.8375625610351562, 0.865234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 7.0, 7.0, 10.0, 6.0, 16.0, 14.0, 22.0, 18.0, 26.0, 40.0, 42.0, 32.0, 51.0, 48.0, 59.0, 51.0, 48.0, 58.0, 62.0, 45.0, 55.0, 31.0, 39.0, 42.0, 36.0, 21.0, 28.0, 12.0, 14.0, 13.0, 15.0, 6.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.15234375, -3.064544677734375, -2.97674560546875, -2.888946533203125, -2.8011474609375, -2.713348388671875, -2.62554931640625, -2.537750244140625, -2.449951171875, -2.362152099609375, -2.27435302734375, -2.186553955078125, -2.0987548828125, -2.010955810546875, -1.92315673828125, -1.835357666015625, -1.74755859375, -1.659759521484375, -1.57196044921875, -1.484161376953125, -1.3963623046875, -1.308563232421875, -1.22076416015625, -1.132965087890625, -1.045166015625, -0.957366943359375, -0.86956787109375, -0.781768798828125, -0.6939697265625, -0.606170654296875, -0.51837158203125, -0.430572509765625, -0.3427734375, -0.254974365234375, -0.16717529296875, -0.079376220703125, 0.0084228515625, 0.096221923828125, 0.18402099609375, 0.271820068359375, 0.359619140625, 0.447418212890625, 0.53521728515625, 0.623016357421875, 0.7108154296875, 0.798614501953125, 0.88641357421875, 0.974212646484375, 1.06201171875, 1.149810791015625, 1.23760986328125, 1.325408935546875, 1.4132080078125, 1.501007080078125, 1.58880615234375, 1.676605224609375, 1.764404296875, 1.852203369140625, 1.94000244140625, 2.027801513671875, 2.1156005859375, 2.203399658203125, 2.29119873046875, 2.378997802734375, 2.466796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 9.0, 16.0, 22.0, 21.0, 45.0, 75.0, 104.0, 160.0, 230.0, 398.0, 734.0, 1048.0, 1960.0, 3097.0, 5413.0, 9854.0, 18274.0, 35884.0, 77309.0, 188147.0, 350241.0, 195338.0, 80279.0, 37143.0, 18917.0, 10205.0, 5718.0, 3228.0, 1829.0, 1098.0, 642.0, 421.0, 265.0, 137.0, 100.0, 78.0, 37.0, 24.0, 16.0, 14.0, 6.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.25439453125, -0.24657249450683594, -0.23875045776367188, -0.2309284210205078, -0.22310638427734375, -0.2152843475341797, -0.20746231079101562, -0.19964027404785156, -0.1918182373046875, -0.18399620056152344, -0.17617416381835938, -0.1683521270751953, -0.16053009033203125, -0.1527080535888672, -0.14488601684570312, -0.13706398010253906, -0.129241943359375, -0.12141990661621094, -0.11359786987304688, -0.10577583312988281, -0.09795379638671875, -0.09013175964355469, -0.08230972290039062, -0.07448768615722656, -0.0666656494140625, -0.05884361267089844, -0.051021575927734375, -0.04319953918457031, -0.03537750244140625, -0.027555465698242188, -0.019733428955078125, -0.011911392211914062, -0.00408935546875, 0.0037326812744140625, 0.011554718017578125, 0.019376754760742188, 0.02719879150390625, 0.03502082824707031, 0.042842864990234375, 0.05066490173339844, 0.0584869384765625, 0.06630897521972656, 0.07413101196289062, 0.08195304870605469, 0.08977508544921875, 0.09759712219238281, 0.10541915893554688, 0.11324119567871094, 0.121063232421875, 0.12888526916503906, 0.13670730590820312, 0.1445293426513672, 0.15235137939453125, 0.1601734161376953, 0.16799545288085938, 0.17581748962402344, 0.1836395263671875, 0.19146156311035156, 0.19928359985351562, 0.2071056365966797, 0.21492767333984375, 0.2227497100830078, 0.23057174682617188, 0.23839378356933594, 0.2462158203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 0.0, 8.0, 9.0, 9.0, 9.0, 10.0, 12.0, 9.0, 14.0, 14.0, 16.0, 25.0, 37.0, 26.0, 31.0, 33.0, 45.0, 47.0, 38.0, 40.0, 46.0, 53.0, 45.0, 56.0, 42.0, 41.0, 31.0, 39.0, 31.0, 27.0, 22.0, 26.0, 20.0, 22.0, 8.0, 14.0, 18.0, 10.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.48828125, -4.3572998046875, -4.226318359375, -4.0953369140625, -3.96435546875, -3.8333740234375, -3.702392578125, -3.5714111328125, -3.4404296875, -3.3094482421875, -3.178466796875, -3.0474853515625, -2.91650390625, -2.7855224609375, -2.654541015625, -2.5235595703125, -2.392578125, -2.2615966796875, -2.130615234375, -1.9996337890625, -1.86865234375, -1.7376708984375, -1.606689453125, -1.4757080078125, -1.3447265625, -1.2137451171875, -1.082763671875, -0.9517822265625, -0.82080078125, -0.6898193359375, -0.558837890625, -0.4278564453125, -0.296875, -0.1658935546875, -0.034912109375, 0.0960693359375, 0.22705078125, 0.3580322265625, 0.489013671875, 0.6199951171875, 0.7509765625, 0.8819580078125, 1.012939453125, 1.1439208984375, 1.27490234375, 1.4058837890625, 1.536865234375, 1.6678466796875, 1.798828125, 1.9298095703125, 2.060791015625, 2.1917724609375, 2.32275390625, 2.4537353515625, 2.584716796875, 2.7156982421875, 2.8466796875, 2.9776611328125, 3.108642578125, 3.2396240234375, 3.37060546875, 3.5015869140625, 3.632568359375, 3.7635498046875, 3.89453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 10.0, 17.0, 25.0, 38.0, 56.0, 97.0, 157.0, 231.0, 381.0, 701.0, 1168.0, 2275.0, 4949.0, 12325.0, 38067.0, 147523.0, 576154.0, 195972.0, 44775.0, 13912.0, 4941.0, 2128.0, 1058.0, 615.0, 347.0, 199.0, 128.0, 82.0, 68.0, 30.0, 27.0, 24.0, 16.0, 10.0, 12.0, 6.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.04827880859375, -0.04692220687866211, -0.04556560516357422, -0.04420900344848633, -0.04285240173339844, -0.04149580001831055, -0.040139198303222656, -0.038782596588134766, -0.037425994873046875, -0.036069393157958984, -0.034712791442871094, -0.0333561897277832, -0.03199958801269531, -0.030642986297607422, -0.02928638458251953, -0.02792978286743164, -0.02657318115234375, -0.02521657943725586, -0.02385997772216797, -0.022503376007080078, -0.021146774291992188, -0.019790172576904297, -0.018433570861816406, -0.017076969146728516, -0.015720367431640625, -0.014363765716552734, -0.013007164001464844, -0.011650562286376953, -0.010293960571289062, -0.008937358856201172, -0.007580757141113281, -0.006224155426025391, -0.0048675537109375, -0.0035109519958496094, -0.0021543502807617188, -0.0007977485656738281, 0.0005588531494140625, 0.0019154548645019531, 0.0032720565795898438, 0.004628658294677734, 0.005985260009765625, 0.007341861724853516, 0.008698463439941406, 0.010055065155029297, 0.011411666870117188, 0.012768268585205078, 0.014124870300292969, 0.01548147201538086, 0.01683807373046875, 0.01819467544555664, 0.01955127716064453, 0.020907878875732422, 0.022264480590820312, 0.023621082305908203, 0.024977684020996094, 0.026334285736083984, 0.027690887451171875, 0.029047489166259766, 0.030404090881347656, 0.03176069259643555, 0.03311729431152344, 0.03447389602661133, 0.03583049774169922, 0.03718709945678711, 0.038543701171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 18.0, 18.0, 23.0, 25.0, 61.0, 62.0, 79.0, 102.0, 134.0, 120.0, 84.0, 70.0, 52.0, 46.0, 30.0, 17.0, 14.0, 13.0, 5.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.786252975463867e-05, -4.618149250745773e-05, -4.4500455260276794e-05, -4.2819418013095856e-05, -4.113838076591492e-05, -3.945734351873398e-05, -3.777630627155304e-05, -3.60952690243721e-05, -3.441423177719116e-05, -3.2733194530010223e-05, -3.1052157282829285e-05, -2.9371120035648346e-05, -2.7690082788467407e-05, -2.600904554128647e-05, -2.432800829410553e-05, -2.264697104692459e-05, -2.0965933799743652e-05, -1.9284896552562714e-05, -1.7603859305381775e-05, -1.5922822058200836e-05, -1.4241784811019897e-05, -1.2560747563838959e-05, -1.087971031665802e-05, -9.198673069477081e-06, -7.517635822296143e-06, -5.836598575115204e-06, -4.155561327934265e-06, -2.4745240807533264e-06, -7.934868335723877e-07, 8.87550413608551e-07, 2.5685876607894897e-06, 4.2496249079704285e-06, 5.930662155151367e-06, 7.611699402332306e-06, 9.292736649513245e-06, 1.0973773896694183e-05, 1.2654811143875122e-05, 1.433584839105606e-05, 1.6016885638237e-05, 1.7697922885417938e-05, 1.9378960132598877e-05, 2.1059997379779816e-05, 2.2741034626960754e-05, 2.4422071874141693e-05, 2.6103109121322632e-05, 2.778414636850357e-05, 2.946518361568451e-05, 3.114622086286545e-05, 3.282725811004639e-05, 3.4508295357227325e-05, 3.6189332604408264e-05, 3.78703698515892e-05, 3.955140709877014e-05, 4.123244434595108e-05, 4.291348159313202e-05, 4.459451884031296e-05, 4.6275556087493896e-05, 4.7956593334674835e-05, 4.9637630581855774e-05, 5.131866782903671e-05, 5.299970507621765e-05, 5.468074232339859e-05, 5.636177957057953e-05, 5.804281681776047e-05, 5.9723854064941406e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 7.0, 4.0, 10.0, 3.0, 19.0, 18.0, 23.0, 18.0, 24.0, 53.0, 63.0, 95.0, 184.0, 417.0, 1850.0, 15640.0, 552790.0, 459717.0, 14968.0, 1834.0, 410.0, 143.0, 74.0, 44.0, 45.0, 27.0, 21.0, 16.0, 9.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.14334487915039062, -0.13886260986328125, -0.13438034057617188, -0.1298980712890625, -0.12541580200195312, -0.12093353271484375, -0.11645126342773438, -0.111968994140625, -0.10748672485351562, -0.10300445556640625, -0.09852218627929688, -0.0940399169921875, -0.08955764770507812, -0.08507537841796875, -0.08059310913085938, -0.07611083984375, -0.07162857055664062, -0.06714630126953125, -0.06266403198242188, -0.0581817626953125, -0.053699493408203125, -0.04921722412109375, -0.044734954833984375, -0.040252685546875, -0.035770416259765625, -0.03128814697265625, -0.026805877685546875, -0.0223236083984375, -0.017841339111328125, -0.01335906982421875, -0.008876800537109375, -0.00439453125, 8.7738037109375e-05, 0.00457000732421875, 0.009052276611328125, 0.0135345458984375, 0.018016815185546875, 0.02249908447265625, 0.026981353759765625, 0.031463623046875, 0.035945892333984375, 0.04042816162109375, 0.044910430908203125, 0.0493927001953125, 0.053874969482421875, 0.05835723876953125, 0.06283950805664062, 0.06732177734375, 0.07180404663085938, 0.07628631591796875, 0.08076858520507812, 0.0852508544921875, 0.08973312377929688, 0.09421539306640625, 0.09869766235351562, 0.103179931640625, 0.10766220092773438, 0.11214447021484375, 0.11662673950195312, 0.1211090087890625, 0.12559127807617188, 0.13007354736328125, 0.13455581665039062, 0.1390380859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 8.0, 7.0, 10.0, 10.0, 14.0, 14.0, 35.0, 25.0, 33.0, 45.0, 52.0, 56.0, 77.0, 97.0, 104.0, 84.0, 74.0, 53.0, 46.0, 32.0, 29.0, 21.0, 18.0, 9.0, 3.0, 6.0, 8.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01367950439453125, -0.013254523277282715, -0.01282954216003418, -0.012404561042785645, -0.01197957992553711, -0.011554598808288574, -0.011129617691040039, -0.010704636573791504, -0.010279655456542969, -0.009854674339294434, -0.009429693222045898, -0.009004712104797363, -0.008579730987548828, -0.008154749870300293, -0.007729768753051758, -0.007304787635803223, -0.0068798065185546875, -0.006454825401306152, -0.006029844284057617, -0.005604863166809082, -0.005179882049560547, -0.004754900932312012, -0.0043299198150634766, -0.0039049386978149414, -0.0034799575805664062, -0.003054976463317871, -0.002629995346069336, -0.0022050142288208008, -0.0017800331115722656, -0.0013550519943237305, -0.0009300708770751953, -0.0005050897598266602, -8.0108642578125e-05, 0.00034487247467041016, 0.0007698535919189453, 0.0011948347091674805, 0.0016198158264160156, 0.0020447969436645508, 0.002469778060913086, 0.002894759178161621, 0.0033197402954101562, 0.0037447214126586914, 0.0041697025299072266, 0.004594683647155762, 0.005019664764404297, 0.005444645881652832, 0.005869626998901367, 0.006294608116149902, 0.0067195892333984375, 0.007144570350646973, 0.007569551467895508, 0.007994532585144043, 0.008419513702392578, 0.008844494819641113, 0.009269475936889648, 0.009694457054138184, 0.010119438171386719, 0.010544419288635254, 0.010969400405883789, 0.011394381523132324, 0.01181936264038086, 0.012244343757629395, 0.01266932487487793, 0.013094305992126465, 0.013519287109375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 3.0, 12.0, 26.0, 31.0, 57.0, 80.0, 134.0, 158.0, 140.0, 132.0, 73.0, 48.0, 39.0, 19.0, 14.0, 9.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.478943347930908, -6.303932189941406, -6.128920555114746, -5.953909397125244, -5.778898239135742, -5.603886604309082, -5.42887544631958, -5.253864288330078, -5.078852653503418, -4.903841495513916, -4.728829860687256, -4.553818702697754, -4.378807067871094, -4.203795909881592, -4.02878475189209, -3.853773355484009, -3.6787619590759277, -3.5037505626678467, -3.3287391662597656, -3.1537280082702637, -2.9787166118621826, -2.8037052154541016, -2.6286940574645996, -2.4536826610565186, -2.2786712646484375, -2.1036598682403564, -1.928648591041565, -1.7536373138427734, -1.5786259174346924, -1.4036145210266113, -1.2286032438278198, -1.0535919666290283, -0.8785805702209473, -0.703569233417511, -0.5285578966140747, -0.3535465598106384, -0.17853522300720215, -0.003523886203765869, 0.1714874505996704, 0.3464987277984619, 0.521510124206543, 0.6965214610099792, 0.8715327978134155, 1.046544075012207, 1.221555471420288, 1.3965668678283691, 1.5715781450271606, 1.7465894222259521, 1.9216008186340332, 2.0966122150421143, 2.2716236114501953, 2.4466347694396973, 2.6216461658477783, 2.7966575622558594, 2.9716687202453613, 3.1466801166534424, 3.3216915130615234, 3.4967029094696045, 3.6717143058776855, 3.8467254638671875, 4.021737098693848, 4.19674825668335, 4.371759414672852, 4.546771049499512, 4.721782207489014]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 13.0, 8.0, 6.0, 11.0, 11.0, 26.0, 20.0, 27.0, 43.0, 40.0, 35.0, 46.0, 34.0, 43.0, 50.0, 47.0, 47.0, 46.0, 52.0, 51.0, 47.0, 37.0, 34.0, 27.0, 28.0, 24.0, 17.0, 23.0, 11.0, 16.0, 12.0, 10.0, 8.0, 6.0, 8.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6686439514160156, -2.5930778980255127, -2.5175118446350098, -2.4419455528259277, -2.366379499435425, -2.290813446044922, -2.215247392654419, -2.139681339263916, -2.064115047454834, -1.988548994064331, -1.9129828214645386, -1.8374167680740356, -1.7618505954742432, -1.6862845420837402, -1.6107184886932373, -1.5351524353027344, -1.4595863819122314, -1.3840203285217285, -1.308454155921936, -1.232888102531433, -1.1573219299316406, -1.0817558765411377, -1.0061898231506348, -0.9306237101554871, -0.8550575971603394, -0.7794914841651917, -0.703925371170044, -0.628359317779541, -0.5527932047843933, -0.4772270917892456, -0.4016610085964203, -0.32609492540359497, -0.25052881240844727, -0.17496271431446075, -0.09939661622047424, -0.023830518126487732, 0.05173557996749878, 0.12730169296264648, 0.2028677761554718, 0.2784338593482971, 0.3539999723434448, 0.42956608533859253, 0.5051321983337402, 0.5806982517242432, 0.6562643647193909, 0.7318304777145386, 0.8073965311050415, 0.8829626441001892, 0.9585287570953369, 1.0340948104858398, 1.1096609830856323, 1.1852270364761353, 1.2607932090759277, 1.3363592624664307, 1.4119253158569336, 1.4874913692474365, 1.563057541847229, 1.638623595237732, 1.7141897678375244, 1.7897558212280273, 1.8653218746185303, 1.9408880472183228, 2.0164542198181152, 2.092020273208618, 2.167586326599121]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 9.0, 5.0, 11.0, 11.0, 21.0, 21.0, 32.0, 41.0, 76.0, 117.0, 185.0, 296.0, 528.0, 934.0, 1729.0, 3102.0, 6249.0, 13166.0, 32359.0, 93957.0, 370963.0, 371612.0, 94059.0, 32302.0, 13300.0, 6336.0, 3076.0, 1730.0, 914.0, 553.0, 304.0, 180.0, 136.0, 84.0, 47.0, 25.0, 25.0, 12.0, 9.0, 9.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8681640625, -1.8058929443359375, -1.743621826171875, -1.6813507080078125, -1.61907958984375, -1.5568084716796875, -1.494537353515625, -1.4322662353515625, -1.3699951171875, -1.3077239990234375, -1.245452880859375, -1.1831817626953125, -1.12091064453125, -1.0586395263671875, -0.996368408203125, -0.9340972900390625, -0.871826171875, -0.8095550537109375, -0.747283935546875, -0.6850128173828125, -0.62274169921875, -0.5604705810546875, -0.498199462890625, -0.4359283447265625, -0.3736572265625, -0.3113861083984375, -0.249114990234375, -0.1868438720703125, -0.12457275390625, -0.0623016357421875, -3.0517578125e-05, 0.0622406005859375, 0.12451171875, 0.1867828369140625, 0.249053955078125, 0.3113250732421875, 0.37359619140625, 0.4358673095703125, 0.498138427734375, 0.5604095458984375, 0.6226806640625, 0.6849517822265625, 0.747222900390625, 0.8094940185546875, 0.87176513671875, 0.9340362548828125, 0.996307373046875, 1.0585784912109375, 1.120849609375, 1.1831207275390625, 1.245391845703125, 1.3076629638671875, 1.36993408203125, 1.4322052001953125, 1.494476318359375, 1.5567474365234375, 1.6190185546875, 1.6812896728515625, 1.743560791015625, 1.8058319091796875, 1.86810302734375, 1.9303741455078125, 1.992645263671875, 2.0549163818359375, 2.1171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 9.0, 3.0, 8.0, 19.0, 16.0, 25.0, 33.0, 45.0, 48.0, 57.0, 61.0, 78.0, 77.0, 78.0, 79.0, 60.0, 80.0, 53.0, 36.0, 39.0, 35.0, 32.0, 15.0, 5.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.989501953125, -15.49462890625, -14.999755859375, -14.5048828125, -14.010009765625, -13.51513671875, -13.020263671875, -12.525390625, -12.030517578125, -11.53564453125, -11.040771484375, -10.5458984375, -10.051025390625, -9.55615234375, -9.061279296875, -8.56640625, -8.071533203125, -7.57666015625, -7.081787109375, -6.5869140625, -6.092041015625, -5.59716796875, -5.102294921875, -4.607421875, -4.112548828125, -3.61767578125, -3.122802734375, -2.6279296875, -2.133056640625, -1.63818359375, -1.143310546875, -0.6484375, -0.153564453125, 0.34130859375, 0.836181640625, 1.3310546875, 1.825927734375, 2.32080078125, 2.815673828125, 3.310546875, 3.805419921875, 4.30029296875, 4.795166015625, 5.2900390625, 5.784912109375, 6.27978515625, 6.774658203125, 7.26953125, 7.764404296875, 8.25927734375, 8.754150390625, 9.2490234375, 9.743896484375, 10.23876953125, 10.733642578125, 11.228515625, 11.723388671875, 12.21826171875, 12.713134765625, 13.2080078125, 13.702880859375, 14.19775390625, 14.692626953125, 15.1875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 7.0, 11.0, 18.0, 29.0, 49.0, 73.0, 155.0, 4055.0, 1043664.0, 208.0, 110.0, 59.0, 41.0, 21.0, 13.0, 6.0, 11.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.9375, -62.455078125, -59.97265625, -57.490234375, -55.0078125, -52.525390625, -50.04296875, -47.560546875, -45.078125, -42.595703125, -40.11328125, -37.630859375, -35.1484375, -32.666015625, -30.18359375, -27.701171875, -25.21875, -22.736328125, -20.25390625, -17.771484375, -15.2890625, -12.806640625, -10.32421875, -7.841796875, -5.359375, -2.876953125, -0.39453125, 2.087890625, 4.5703125, 7.052734375, 9.53515625, 12.017578125, 14.5, 16.982421875, 19.46484375, 21.947265625, 24.4296875, 26.912109375, 29.39453125, 31.876953125, 34.359375, 36.841796875, 39.32421875, 41.806640625, 44.2890625, 46.771484375, 49.25390625, 51.736328125, 54.21875, 56.701171875, 59.18359375, 61.666015625, 64.1484375, 66.630859375, 69.11328125, 71.595703125, 74.078125, 76.560546875, 79.04296875, 81.525390625, 84.0078125, 86.490234375, 88.97265625, 91.455078125, 93.9375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 7.0, 11.0, 18.0, 28.0, 51.0, 68.0, 120.0, 146.0, 156.0, 125.0, 97.0, 61.0, 39.0, 22.0, 13.0, 5.0, 11.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.171875, -25.171630859375, -24.17138671875, -23.171142578125, -22.1708984375, -21.170654296875, -20.17041015625, -19.170166015625, -18.169921875, -17.169677734375, -16.16943359375, -15.169189453125, -14.1689453125, -13.168701171875, -12.16845703125, -11.168212890625, -10.16796875, -9.167724609375, -8.16748046875, -7.167236328125, -6.1669921875, -5.166748046875, -4.16650390625, -3.166259765625, -2.166015625, -1.165771484375, -0.16552734375, 0.834716796875, 1.8349609375, 2.835205078125, 3.83544921875, 4.835693359375, 5.8359375, 6.836181640625, 7.83642578125, 8.836669921875, 9.8369140625, 10.837158203125, 11.83740234375, 12.837646484375, 13.837890625, 14.838134765625, 15.83837890625, 16.838623046875, 17.8388671875, 18.839111328125, 19.83935546875, 20.839599609375, 21.83984375, 22.840087890625, 23.84033203125, 24.840576171875, 25.8408203125, 26.841064453125, 27.84130859375, 28.841552734375, 29.841796875, 30.842041015625, 31.84228515625, 32.842529296875, 33.8427734375, 34.843017578125, 35.84326171875, 36.843505859375, 37.84375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 20.0, 24.0, 24.0, 31.0, 71.0, 117.0, 205.0, 470.0, 1214.0, 3299.0, 11105.0, 120995.0, 885967.0, 17524.0, 4542.0, 1644.0, 636.0, 283.0, 144.0, 74.0, 43.0, 28.0, 22.0, 16.0, 9.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90576171875, -0.8735885620117188, -0.8414154052734375, -0.8092422485351562, -0.777069091796875, -0.7448959350585938, -0.7127227783203125, -0.6805496215820312, -0.64837646484375, -0.6162033081054688, -0.5840301513671875, -0.5518569946289062, -0.519683837890625, -0.48751068115234375, -0.4553375244140625, -0.42316436767578125, -0.3909912109375, -0.35881805419921875, -0.3266448974609375, -0.29447174072265625, -0.262298583984375, -0.23012542724609375, -0.1979522705078125, -0.16577911376953125, -0.13360595703125, -0.10143280029296875, -0.0692596435546875, -0.03708648681640625, -0.004913330078125, 0.02725982666015625, 0.0594329833984375, 0.09160614013671875, 0.123779296875, 0.15595245361328125, 0.1881256103515625, 0.22029876708984375, 0.252471923828125, 0.28464508056640625, 0.3168182373046875, 0.34899139404296875, 0.38116455078125, 0.41333770751953125, 0.4455108642578125, 0.47768402099609375, 0.509857177734375, 0.5420303344726562, 0.5742034912109375, 0.6063766479492188, 0.6385498046875, 0.6707229614257812, 0.7028961181640625, 0.7350692749023438, 0.767242431640625, 0.7994155883789062, 0.8315887451171875, 0.8637619018554688, 0.89593505859375, 0.9281082153320312, 0.9602813720703125, 0.9924545288085938, 1.024627685546875, 1.0568008422851562, 1.0889739990234375, 1.1211471557617188, 1.1533203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 4.0, 5.0, 11.0, 18.0, 36.0, 49.0, 116.0, 265.0, 251.0, 105.0, 44.0, 27.0, 11.0, 5.0, 11.0, 5.0, 9.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014281272888183594, -0.0001384727656841278, -0.00013413280248641968, -0.00012979283928871155, -0.00012545287609100342, -0.00012111291289329529, -0.00011677294969558716, -0.00011243298649787903, -0.0001080930233001709, -0.00010375306010246277, -9.941309690475464e-05, -9.507313370704651e-05, -9.073317050933838e-05, -8.639320731163025e-05, -8.205324411392212e-05, -7.771328091621399e-05, -7.337331771850586e-05, -6.903335452079773e-05, -6.46933913230896e-05, -6.035342812538147e-05, -5.601346492767334e-05, -5.167350172996521e-05, -4.733353853225708e-05, -4.299357533454895e-05, -3.865361213684082e-05, -3.431364893913269e-05, -2.997368574142456e-05, -2.563372254371643e-05, -2.12937593460083e-05, -1.695379614830017e-05, -1.2613832950592041e-05, -8.273869752883911e-06, -3.933906555175781e-06, 4.0605664253234863e-07, 4.7460198402404785e-06, 9.085983037948608e-06, 1.3425946235656738e-05, 1.7765909433364868e-05, 2.2105872631072998e-05, 2.6445835828781128e-05, 3.078579902648926e-05, 3.512576222419739e-05, 3.946572542190552e-05, 4.380568861961365e-05, 4.814565181732178e-05, 5.248561501502991e-05, 5.682557821273804e-05, 6.116554141044617e-05, 6.55055046081543e-05, 6.984546780586243e-05, 7.418543100357056e-05, 7.852539420127869e-05, 8.286535739898682e-05, 8.720532059669495e-05, 9.154528379440308e-05, 9.58852469921112e-05, 0.00010022521018981934, 0.00010456517338752747, 0.0001089051365852356, 0.00011324509978294373, 0.00011758506298065186, 0.00012192502617835999, 0.00012626498937606812, 0.00013060495257377625, 0.00013494491577148438]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 22.0, 32.0, 35.0, 76.0, 113.0, 215.0, 479.0, 1393.0, 4266.0, 18004.0, 916114.0, 94034.0, 9335.0, 2650.0, 941.0, 372.0, 176.0, 94.0, 48.0, 36.0, 30.0, 17.0, 11.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.9709320068359375, -0.936004638671875, -0.9010772705078125, -0.86614990234375, -0.8312225341796875, -0.796295166015625, -0.7613677978515625, -0.7264404296875, -0.6915130615234375, -0.656585693359375, -0.6216583251953125, -0.58673095703125, -0.5518035888671875, -0.516876220703125, -0.4819488525390625, -0.447021484375, -0.4120941162109375, -0.377166748046875, -0.3422393798828125, -0.30731201171875, -0.2723846435546875, -0.237457275390625, -0.2025299072265625, -0.1676025390625, -0.1326751708984375, -0.097747802734375, -0.0628204345703125, -0.02789306640625, 0.0070343017578125, 0.041961669921875, 0.0768890380859375, 0.11181640625, 0.1467437744140625, 0.181671142578125, 0.2165985107421875, 0.25152587890625, 0.2864532470703125, 0.321380615234375, 0.3563079833984375, 0.3912353515625, 0.4261627197265625, 0.461090087890625, 0.4960174560546875, 0.53094482421875, 0.5658721923828125, 0.600799560546875, 0.6357269287109375, 0.670654296875, 0.7055816650390625, 0.740509033203125, 0.7754364013671875, 0.81036376953125, 0.8452911376953125, 0.880218505859375, 0.9151458740234375, 0.9500732421875, 0.9850006103515625, 1.019927978515625, 1.0548553466796875, 1.08978271484375, 1.1247100830078125, 1.159637451171875, 1.1945648193359375, 1.2294921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 4.0, 10.0, 11.0, 21.0, 40.0, 69.0, 394.0, 296.0, 57.0, 25.0, 20.0, 13.0, 8.0, 7.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322265625, -0.31072998046875, -0.2991943359375, -0.28765869140625, -0.276123046875, -0.26458740234375, -0.2530517578125, -0.24151611328125, -0.22998046875, -0.21844482421875, -0.2069091796875, -0.19537353515625, -0.183837890625, -0.17230224609375, -0.1607666015625, -0.14923095703125, -0.1376953125, -0.12615966796875, -0.1146240234375, -0.10308837890625, -0.091552734375, -0.08001708984375, -0.0684814453125, -0.05694580078125, -0.04541015625, -0.03387451171875, -0.0223388671875, -0.01080322265625, 0.000732421875, 0.01226806640625, 0.0238037109375, 0.03533935546875, 0.046875, 0.05841064453125, 0.0699462890625, 0.08148193359375, 0.093017578125, 0.10455322265625, 0.1160888671875, 0.12762451171875, 0.13916015625, 0.15069580078125, 0.1622314453125, 0.17376708984375, 0.185302734375, 0.19683837890625, 0.2083740234375, 0.21990966796875, 0.2314453125, 0.24298095703125, 0.2545166015625, 0.26605224609375, 0.277587890625, 0.28912353515625, 0.3006591796875, 0.31219482421875, 0.32373046875, 0.33526611328125, 0.3468017578125, 0.35833740234375, 0.369873046875, 0.38140869140625, 0.3929443359375, 0.40447998046875, 0.416015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 8.0, 20.0, 31.0, 64.0, 96.0, 110.0, 173.0, 157.0, 130.0, 75.0, 53.0, 30.0, 14.0, 15.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.82423210144043, -12.486954689025879, -12.149678230285645, -11.812400817871094, -11.475123405456543, -11.137845993041992, -10.800569534301758, -10.463292121887207, -10.126014709472656, -9.788737297058105, -9.451460838317871, -9.11418342590332, -8.77690601348877, -8.439628601074219, -8.102352142333984, -7.765074729919434, -7.427798271179199, -7.090521335601807, -6.753243923187256, -6.415966987609863, -6.0786895751953125, -5.74141263961792, -5.404135704040527, -5.066858291625977, -4.729581356048584, -4.392304420471191, -4.055027008056641, -3.717750072479248, -3.3804728984832764, -3.0431957244873047, -2.705918788909912, -2.3686416149139404, -2.0313644409179688, -1.694087266921997, -1.356810212135315, -1.0195331573486328, -0.6822559833526611, -0.34497880935668945, -0.007701873779296875, 0.3295753002166748, 0.6668524742126465, 1.0041296482086182, 1.3414067029953003, 1.6786837577819824, 2.015960931777954, 2.353238105773926, 2.6905150413513184, 3.02779221534729, 3.3650693893432617, 3.7023465633392334, 4.039623737335205, 4.376900672912598, 4.714178085327148, 5.051455020904541, 5.388731956481934, 5.726009368896484, 6.063286304473877, 6.4005632400512695, 6.73784065246582, 7.075117588043213, 7.4123945236206055, 7.749671936035156, 8.08694839477539, 8.424225807189941, 8.761503219604492]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 7.0, 3.0, 3.0, 8.0, 15.0, 15.0, 17.0, 15.0, 18.0, 19.0, 43.0, 19.0, 26.0, 36.0, 37.0, 45.0, 29.0, 36.0, 39.0, 33.0, 41.0, 34.0, 32.0, 28.0, 37.0, 39.0, 38.0, 27.0, 37.0, 22.0, 28.0, 21.0, 18.0, 16.0, 12.0, 18.0, 15.0, 12.0, 10.0, 14.0, 4.0, 7.0, 3.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-12.192366600036621, -11.805703163146973, -11.41904067993164, -11.032377243041992, -10.645713806152344, -10.259051322937012, -9.872387886047363, -9.485725402832031, -9.099061965942383, -8.712398529052734, -8.325736045837402, -7.939072608947754, -7.552409648895264, -7.165746688842773, -6.779083251953125, -6.392420291900635, -6.0057573318481445, -5.619094371795654, -5.232431411743164, -4.845767974853516, -4.459105014801025, -4.072442054748535, -3.685778856277466, -3.2991156578063965, -2.9124526977539062, -2.525789737701416, -2.1391265392303467, -1.752463459968567, -1.365800380706787, -0.9791373014450073, -0.5924742221832275, -0.2058110237121582, 0.18085289001464844, 0.5675159692764282, 0.954179048538208, 1.3408421277999878, 1.7275052070617676, 2.114168167114258, 2.500831365585327, 2.8874945640563965, 3.2741575241088867, 3.660820484161377, 4.047483444213867, 4.434146881103516, 4.820809841156006, 5.207472801208496, 5.5941362380981445, 5.980799198150635, 6.367462158203125, 6.754125118255615, 7.1407880783081055, 7.527451515197754, 7.914114475250244, 8.300777435302734, 8.687440872192383, 9.074104309082031, 9.460766792297363, 9.847430229187012, 10.234092712402344, 10.620756149291992, 11.00741958618164, 11.394082069396973, 11.780745506286621, 12.167407989501953, 12.554071426391602]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 2.0, 15.0, 10.0, 21.0, 27.0, 32.0, 54.0, 67.0, 115.0, 310.0, 1112.0, 5704.0, 87145.0, 3159705.0, 912572.0, 23566.0, 2829.0, 541.0, 175.0, 90.0, 42.0, 33.0, 30.0, 26.0, 18.0, 13.0, 6.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.897216796875, -9.57568359375, -9.254150390625, -8.9326171875, -8.611083984375, -8.28955078125, -7.968017578125, -7.646484375, -7.324951171875, -7.00341796875, -6.681884765625, -6.3603515625, -6.038818359375, -5.71728515625, -5.395751953125, -5.07421875, -4.752685546875, -4.43115234375, -4.109619140625, -3.7880859375, -3.466552734375, -3.14501953125, -2.823486328125, -2.501953125, -2.180419921875, -1.85888671875, -1.537353515625, -1.2158203125, -0.894287109375, -0.57275390625, -0.251220703125, 0.0703125, 0.391845703125, 0.71337890625, 1.034912109375, 1.3564453125, 1.677978515625, 1.99951171875, 2.321044921875, 2.642578125, 2.964111328125, 3.28564453125, 3.607177734375, 3.9287109375, 4.250244140625, 4.57177734375, 4.893310546875, 5.21484375, 5.536376953125, 5.85791015625, 6.179443359375, 6.5009765625, 6.822509765625, 7.14404296875, 7.465576171875, 7.787109375, 8.108642578125, 8.43017578125, 8.751708984375, 9.0732421875, 9.394775390625, 9.71630859375, 10.037841796875, 10.359375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 12.0, 13.0, 19.0, 17.0, 28.0, 27.0, 40.0, 58.0, 46.0, 65.0, 65.0, 52.0, 68.0, 67.0, 68.0, 66.0, 53.0, 44.0, 39.0, 27.0, 27.0, 22.0, 24.0, 9.0, 12.0, 6.0, 6.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.02734375, -4.9033203125, -4.779296875, -4.6552734375, -4.53125, -4.4072265625, -4.283203125, -4.1591796875, -4.03515625, -3.9111328125, -3.787109375, -3.6630859375, -3.5390625, -3.4150390625, -3.291015625, -3.1669921875, -3.04296875, -2.9189453125, -2.794921875, -2.6708984375, -2.546875, -2.4228515625, -2.298828125, -2.1748046875, -2.05078125, -1.9267578125, -1.802734375, -1.6787109375, -1.5546875, -1.4306640625, -1.306640625, -1.1826171875, -1.05859375, -0.9345703125, -0.810546875, -0.6865234375, -0.5625, -0.4384765625, -0.314453125, -0.1904296875, -0.06640625, 0.0576171875, 0.181640625, 0.3056640625, 0.4296875, 0.5537109375, 0.677734375, 0.8017578125, 0.92578125, 1.0498046875, 1.173828125, 1.2978515625, 1.421875, 1.5458984375, 1.669921875, 1.7939453125, 1.91796875, 2.0419921875, 2.166015625, 2.2900390625, 2.4140625, 2.5380859375, 2.662109375, 2.7861328125, 2.91015625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 8.0, 13.0, 25.0, 44.0, 82.0, 127.0, 296.0, 788.0, 3465329.0, 726226.0, 743.0, 270.0, 156.0, 63.0, 37.0, 18.0, 7.0, 14.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-46.4375, -45.0703125, -43.703125, -42.3359375, -40.96875, -39.6015625, -38.234375, -36.8671875, -35.5, -34.1328125, -32.765625, -31.3984375, -30.03125, -28.6640625, -27.296875, -25.9296875, -24.5625, -23.1953125, -21.828125, -20.4609375, -19.09375, -17.7265625, -16.359375, -14.9921875, -13.625, -12.2578125, -10.890625, -9.5234375, -8.15625, -6.7890625, -5.421875, -4.0546875, -2.6875, -1.3203125, 0.046875, 1.4140625, 2.78125, 4.1484375, 5.515625, 6.8828125, 8.25, 9.6171875, 10.984375, 12.3515625, 13.71875, 15.0859375, 16.453125, 17.8203125, 19.1875, 20.5546875, 21.921875, 23.2890625, 24.65625, 26.0234375, 27.390625, 28.7578125, 30.125, 31.4921875, 32.859375, 34.2265625, 35.59375, 36.9609375, 38.328125, 39.6953125, 41.0625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 7.0, 6.0, 7.0, 11.0, 11.0, 20.0, 29.0, 41.0, 64.0, 69.0, 85.0, 158.0, 235.0, 355.0, 548.0, 619.0, 536.0, 401.0, 249.0, 182.0, 133.0, 90.0, 57.0, 44.0, 37.0, 22.0, 13.0, 10.0, 9.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5625, -1.5185699462890625, -1.474639892578125, -1.4307098388671875, -1.38677978515625, -1.3428497314453125, -1.298919677734375, -1.2549896240234375, -1.2110595703125, -1.1671295166015625, -1.123199462890625, -1.0792694091796875, -1.03533935546875, -0.9914093017578125, -0.947479248046875, -0.9035491943359375, -0.859619140625, -0.8156890869140625, -0.771759033203125, -0.7278289794921875, -0.68389892578125, -0.6399688720703125, -0.596038818359375, -0.5521087646484375, -0.5081787109375, -0.4642486572265625, -0.420318603515625, -0.3763885498046875, -0.33245849609375, -0.2885284423828125, -0.244598388671875, -0.2006683349609375, -0.15673828125, -0.1128082275390625, -0.068878173828125, -0.0249481201171875, 0.01898193359375, 0.0629119873046875, 0.106842041015625, 0.1507720947265625, 0.1947021484375, 0.2386322021484375, 0.282562255859375, 0.3264923095703125, 0.37042236328125, 0.4143524169921875, 0.458282470703125, 0.5022125244140625, 0.546142578125, 0.5900726318359375, 0.634002685546875, 0.6779327392578125, 0.72186279296875, 0.7657928466796875, 0.809722900390625, 0.8536529541015625, 0.8975830078125, 0.9415130615234375, 0.985443115234375, 1.0293731689453125, 1.07330322265625, 1.1172332763671875, 1.161163330078125, 1.2050933837890625, 1.2490234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 7.0, 1.0, 3.0, 11.0, 15.0, 27.0, 64.0, 102.0, 163.0, 189.0, 189.0, 114.0, 66.0, 35.0, 14.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7007694244384766, -3.357156276702881, -3.013542890548706, -2.6699295043945312, -2.3263163566589355, -1.9827030897140503, -1.639089822769165, -1.2954764366149902, -0.9518632888793945, -0.6082500219345093, -0.264636754989624, 0.07897651195526123, 0.4225897789001465, 0.7662030458450317, 1.109816312789917, 1.4534296989440918, 1.7970428466796875, 2.140655994415283, 2.484269380569458, 2.827882766723633, 3.1714959144592285, 3.515109062194824, 3.858722448348999, 4.202335834503174, 4.5459489822387695, 4.889562129974365, 5.233175277709961, 5.576788902282715, 5.9204020500183105, 6.264015197753906, 6.60762882232666, 6.951241970062256, 7.294855117797852, 7.638468265533447, 7.982081413269043, 8.325695037841797, 8.669307708740234, 9.012921333312988, 9.356534957885742, 9.70014762878418, 10.043761253356934, 10.387374877929688, 10.730987548828125, 11.074601173400879, 11.418214797973633, 11.76182746887207, 12.105441093444824, 12.449054718017578, 12.792667388916016, 13.13628101348877, 13.479893684387207, 13.823507308959961, 14.167119979858398, 14.510733604431152, 14.854347229003906, 15.197959899902344, 15.541573524475098, 15.885187149047852, 16.22879981994629, 16.572412490844727, 16.916027069091797, 17.259639739990234, 17.603252410888672, 17.946866989135742, 18.29047966003418]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 11.0, 14.0, 18.0, 22.0, 20.0, 26.0, 30.0, 32.0, 51.0, 55.0, 57.0, 47.0, 59.0, 53.0, 57.0, 50.0, 55.0, 50.0, 37.0, 48.0, 37.0, 36.0, 30.0, 15.0, 16.0, 16.0, 8.0, 8.0, 2.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.379016399383545, -4.25968074798584, -4.140345096588135, -4.02100944519043, -3.9016737937927246, -3.7823381423950195, -3.6630024909973145, -3.5436666011810303, -3.424330949783325, -3.30499529838562, -3.185659646987915, -3.06632399559021, -2.946988344192505, -2.8276524543762207, -2.7083168029785156, -2.5889811515808105, -2.4696455001831055, -2.3503098487854004, -2.2309741973876953, -2.1116385459899902, -1.9923027753829956, -1.8729671239852905, -1.7536314725875854, -1.6342957019805908, -1.5149602890014648, -1.3956246376037598, -1.2762889862060547, -1.1569533348083496, -1.037617564201355, -0.9182819128036499, -0.7989462614059448, -0.679610550403595, -0.5602748394012451, -0.44093915820121765, -0.3216034770011902, -0.2022678256034851, -0.08293214440345764, 0.036403536796569824, 0.1557391881942749, 0.27507489919662476, 0.39441055059432983, 0.5137462019920349, 0.6330819129943848, 0.7524175643920898, 0.8717532157897949, 0.9910889267921448, 1.110424518585205, 1.2297602891921997, 1.3490959405899048, 1.4684315919876099, 1.587767243385315, 1.7071030139923096, 1.8264386653900146, 1.9457743167877197, 2.065109968185425, 2.18444561958313, 2.303781270980835, 2.42311692237854, 2.542452573776245, 2.66178822517395, 2.7811238765716553, 2.9004597663879395, 3.0197954177856445, 3.1391310691833496, 3.2584667205810547]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 11.0, 11.0, 15.0, 16.0, 28.0, 46.0, 48.0, 84.0, 111.0, 155.0, 328.0, 406.0, 748.0, 1292.0, 2368.0, 5003.0, 14236.0, 93268.0, 794623.0, 109129.0, 15405.0, 5282.0, 2506.0, 1335.0, 754.0, 462.0, 294.0, 179.0, 109.0, 92.0, 44.0, 48.0, 27.0, 33.0, 15.0, 7.0, 7.0, 8.0, 1.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9755859375, -0.9413909912109375, -0.907196044921875, -0.8730010986328125, -0.83880615234375, -0.8046112060546875, -0.770416259765625, -0.7362213134765625, -0.7020263671875, -0.6678314208984375, -0.633636474609375, -0.5994415283203125, -0.56524658203125, -0.5310516357421875, -0.496856689453125, -0.4626617431640625, -0.428466796875, -0.3942718505859375, -0.360076904296875, -0.3258819580078125, -0.29168701171875, -0.2574920654296875, -0.223297119140625, -0.1891021728515625, -0.1549072265625, -0.1207122802734375, -0.086517333984375, -0.0523223876953125, -0.01812744140625, 0.0160675048828125, 0.050262451171875, 0.0844573974609375, 0.11865234375, 0.1528472900390625, 0.187042236328125, 0.2212371826171875, 0.25543212890625, 0.2896270751953125, 0.323822021484375, 0.3580169677734375, 0.3922119140625, 0.4264068603515625, 0.460601806640625, 0.4947967529296875, 0.52899169921875, 0.5631866455078125, 0.597381591796875, 0.6315765380859375, 0.665771484375, 0.6999664306640625, 0.734161376953125, 0.7683563232421875, 0.80255126953125, 0.8367462158203125, 0.870941162109375, 0.9051361083984375, 0.9393310546875, 0.9735260009765625, 1.007720947265625, 1.0419158935546875, 1.07611083984375, 1.1103057861328125, 1.144500732421875, 1.1786956787109375, 1.212890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 1.0, 7.0, 8.0, 6.0, 14.0, 17.0, 17.0, 25.0, 30.0, 28.0, 44.0, 46.0, 56.0, 56.0, 57.0, 61.0, 75.0, 58.0, 62.0, 48.0, 51.0, 46.0, 41.0, 32.0, 31.0, 18.0, 10.0, 12.0, 13.0, 5.0, 5.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.869140625, -2.789794921875, -2.71044921875, -2.631103515625, -2.5517578125, -2.472412109375, -2.39306640625, -2.313720703125, -2.234375, -2.155029296875, -2.07568359375, -1.996337890625, -1.9169921875, -1.837646484375, -1.75830078125, -1.678955078125, -1.599609375, -1.520263671875, -1.44091796875, -1.361572265625, -1.2822265625, -1.202880859375, -1.12353515625, -1.044189453125, -0.96484375, -0.885498046875, -0.80615234375, -0.726806640625, -0.6474609375, -0.568115234375, -0.48876953125, -0.409423828125, -0.330078125, -0.250732421875, -0.17138671875, -0.092041015625, -0.0126953125, 0.066650390625, 0.14599609375, 0.225341796875, 0.3046875, 0.384033203125, 0.46337890625, 0.542724609375, 0.6220703125, 0.701416015625, 0.78076171875, 0.860107421875, 0.939453125, 1.018798828125, 1.09814453125, 1.177490234375, 1.2568359375, 1.336181640625, 1.41552734375, 1.494873046875, 1.57421875, 1.653564453125, 1.73291015625, 1.812255859375, 1.8916015625, 1.970947265625, 2.05029296875, 2.129638671875, 2.208984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 12.0, 15.0, 25.0, 48.0, 41.0, 77.0, 97.0, 161.0, 212.0, 354.0, 525.0, 781.0, 1390.0, 2466.0, 4278.0, 8627.0, 17287.0, 39715.0, 107243.0, 344757.0, 340881.0, 105188.0, 39227.0, 17096.0, 8088.0, 4104.0, 2195.0, 1274.0, 746.0, 518.0, 363.0, 219.0, 141.0, 110.0, 78.0, 57.0, 30.0, 30.0, 16.0, 15.0, 7.0, 10.0, 5.0, 8.0, 10.0, 5.0, 4.0, 0.0, 4.0], "bins": [-0.28369140625, -0.2755851745605469, -0.26747894287109375, -0.2593727111816406, -0.2512664794921875, -0.24316024780273438, -0.23505401611328125, -0.22694778442382812, -0.218841552734375, -0.21073532104492188, -0.20262908935546875, -0.19452285766601562, -0.1864166259765625, -0.17831039428710938, -0.17020416259765625, -0.16209793090820312, -0.15399169921875, -0.14588546752929688, -0.13777923583984375, -0.12967300415039062, -0.1215667724609375, -0.11346054077148438, -0.10535430908203125, -0.09724807739257812, -0.089141845703125, -0.08103561401367188, -0.07292938232421875, -0.06482315063476562, -0.0567169189453125, -0.048610687255859375, -0.04050445556640625, -0.032398223876953125, -0.0242919921875, -0.016185760498046875, -0.00807952880859375, 2.6702880859375e-05, 0.0081329345703125, 0.016239166259765625, 0.02434539794921875, 0.032451629638671875, 0.040557861328125, 0.048664093017578125, 0.05677032470703125, 0.06487655639648438, 0.0729827880859375, 0.08108901977539062, 0.08919525146484375, 0.09730148315429688, 0.10540771484375, 0.11351394653320312, 0.12162017822265625, 0.12972640991210938, 0.1378326416015625, 0.14593887329101562, 0.15404510498046875, 0.16215133666992188, 0.170257568359375, 0.17836380004882812, 0.18647003173828125, 0.19457626342773438, 0.2026824951171875, 0.21078872680664062, 0.21889495849609375, 0.22700119018554688, 0.235107421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 9.0, 14.0, 14.0, 27.0, 34.0, 28.0, 42.0, 41.0, 41.0, 61.0, 55.0, 66.0, 63.0, 67.0, 72.0, 58.0, 56.0, 37.0, 43.0, 32.0, 30.0, 20.0, 17.0, 16.0, 13.0, 6.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.733642578125, -4.59228515625, -4.450927734375, -4.3095703125, -4.168212890625, -4.02685546875, -3.885498046875, -3.744140625, -3.602783203125, -3.46142578125, -3.320068359375, -3.1787109375, -3.037353515625, -2.89599609375, -2.754638671875, -2.61328125, -2.471923828125, -2.33056640625, -2.189208984375, -2.0478515625, -1.906494140625, -1.76513671875, -1.623779296875, -1.482421875, -1.341064453125, -1.19970703125, -1.058349609375, -0.9169921875, -0.775634765625, -0.63427734375, -0.492919921875, -0.3515625, -0.210205078125, -0.06884765625, 0.072509765625, 0.2138671875, 0.355224609375, 0.49658203125, 0.637939453125, 0.779296875, 0.920654296875, 1.06201171875, 1.203369140625, 1.3447265625, 1.486083984375, 1.62744140625, 1.768798828125, 1.91015625, 2.051513671875, 2.19287109375, 2.334228515625, 2.4755859375, 2.616943359375, 2.75830078125, 2.899658203125, 3.041015625, 3.182373046875, 3.32373046875, 3.465087890625, 3.6064453125, 3.747802734375, 3.88916015625, 4.030517578125, 4.171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 10.0, 18.0, 22.0, 26.0, 43.0, 72.0, 77.0, 136.0, 228.0, 415.0, 1284.0, 8291.0, 911089.0, 121711.0, 3807.0, 713.0, 260.0, 122.0, 82.0, 48.0, 36.0, 23.0, 10.0, 6.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1649169921875, -0.15989112854003906, -0.15486526489257812, -0.1498394012451172, -0.14481353759765625, -0.1397876739501953, -0.13476181030273438, -0.12973594665527344, -0.1247100830078125, -0.11968421936035156, -0.11465835571289062, -0.10963249206542969, -0.10460662841796875, -0.09958076477050781, -0.09455490112304688, -0.08952903747558594, -0.084503173828125, -0.07947731018066406, -0.07445144653320312, -0.06942558288574219, -0.06439971923828125, -0.05937385559082031, -0.054347991943359375, -0.04932212829589844, -0.0442962646484375, -0.03927040100097656, -0.034244537353515625, -0.029218673706054688, -0.02419281005859375, -0.019166946411132812, -0.014141082763671875, -0.009115219116210938, -0.00408935546875, 0.0009365081787109375, 0.005962371826171875, 0.010988235473632812, 0.01601409912109375, 0.021039962768554688, 0.026065826416015625, 0.031091690063476562, 0.0361175537109375, 0.04114341735839844, 0.046169281005859375, 0.05119514465332031, 0.05622100830078125, 0.06124687194824219, 0.06627273559570312, 0.07129859924316406, 0.076324462890625, 0.08135032653808594, 0.08637619018554688, 0.09140205383300781, 0.09642791748046875, 0.10145378112792969, 0.10647964477539062, 0.11150550842285156, 0.1165313720703125, 0.12155723571777344, 0.12658309936523438, 0.1316089630126953, 0.13663482666015625, 0.1416606903076172, 0.14668655395507812, 0.15171241760253906, 0.15673828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 2.0, 6.0, 4.0, 12.0, 20.0, 33.0, 38.0, 56.0, 69.0, 119.0, 109.0, 118.0, 126.0, 75.0, 61.0, 43.0, 48.0, 21.0, 11.0, 11.0, 6.0, 5.0, 1.0, 5.0, 2.0], "bins": [-7.551908493041992e-05, -7.401406764984131e-05, -7.25090503692627e-05, -7.100403308868408e-05, -6.949901580810547e-05, -6.799399852752686e-05, -6.648898124694824e-05, -6.498396396636963e-05, -6.347894668579102e-05, -6.19739294052124e-05, -6.046891212463379e-05, -5.8963894844055176e-05, -5.745887756347656e-05, -5.595386028289795e-05, -5.4448843002319336e-05, -5.294382572174072e-05, -5.143880844116211e-05, -4.9933791160583496e-05, -4.842877388000488e-05, -4.692375659942627e-05, -4.5418739318847656e-05, -4.391372203826904e-05, -4.240870475769043e-05, -4.0903687477111816e-05, -3.93986701965332e-05, -3.789365291595459e-05, -3.6388635635375977e-05, -3.488361835479736e-05, -3.337860107421875e-05, -3.187358379364014e-05, -3.0368566513061523e-05, -2.886354923248291e-05, -2.7358531951904297e-05, -2.5853514671325684e-05, -2.434849739074707e-05, -2.2843480110168457e-05, -2.1338462829589844e-05, -1.983344554901123e-05, -1.8328428268432617e-05, -1.6823410987854004e-05, -1.531839370727539e-05, -1.3813376426696777e-05, -1.2308359146118164e-05, -1.080334186553955e-05, -9.298324584960938e-06, -7.793307304382324e-06, -6.288290023803711e-06, -4.783272743225098e-06, -3.2782554626464844e-06, -1.773238182067871e-06, -2.682209014892578e-07, 1.2367963790893555e-06, 2.7418136596679688e-06, 4.246830940246582e-06, 5.751848220825195e-06, 7.256865501403809e-06, 8.761882781982422e-06, 1.0266900062561035e-05, 1.1771917343139648e-05, 1.3276934623718262e-05, 1.4781951904296875e-05, 1.6286969184875488e-05, 1.77919864654541e-05, 1.9297003746032715e-05, 2.0802021026611328e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 11.0, 19.0, 43.0, 122.0, 406.0, 1499.0, 19359.0, 1018712.0, 6876.0, 1030.0, 284.0, 106.0, 40.0, 16.0, 12.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3619537353515625, -0.351104736328125, -0.3402557373046875, -0.32940673828125, -0.3185577392578125, -0.307708740234375, -0.2968597412109375, -0.2860107421875, -0.2751617431640625, -0.264312744140625, -0.2534637451171875, -0.24261474609375, -0.2317657470703125, -0.220916748046875, -0.2100677490234375, -0.19921875, -0.1883697509765625, -0.177520751953125, -0.1666717529296875, -0.15582275390625, -0.1449737548828125, -0.134124755859375, -0.1232757568359375, -0.1124267578125, -0.1015777587890625, -0.090728759765625, -0.0798797607421875, -0.06903076171875, -0.0581817626953125, -0.047332763671875, -0.0364837646484375, -0.025634765625, -0.0147857666015625, -0.003936767578125, 0.0069122314453125, 0.01776123046875, 0.0286102294921875, 0.039459228515625, 0.0503082275390625, 0.0611572265625, 0.0720062255859375, 0.082855224609375, 0.0937042236328125, 0.10455322265625, 0.1154022216796875, 0.126251220703125, 0.1371002197265625, 0.14794921875, 0.1587982177734375, 0.169647216796875, 0.1804962158203125, 0.19134521484375, 0.2021942138671875, 0.213043212890625, 0.2238922119140625, 0.2347412109375, 0.2455902099609375, 0.256439208984375, 0.2672882080078125, 0.27813720703125, 0.2889862060546875, 0.299835205078125, 0.3106842041015625, 0.321533203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 8.0, 24.0, 65.0, 380.0, 406.0, 58.0, 26.0, 10.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047637939453125, -0.046236515045166016, -0.04483509063720703, -0.04343366622924805, -0.04203224182128906, -0.04063081741333008, -0.039229393005371094, -0.03782796859741211, -0.036426544189453125, -0.03502511978149414, -0.033623695373535156, -0.03222227096557617, -0.030820846557617188, -0.029419422149658203, -0.02801799774169922, -0.026616573333740234, -0.02521514892578125, -0.023813724517822266, -0.02241230010986328, -0.021010875701904297, -0.019609451293945312, -0.018208026885986328, -0.016806602478027344, -0.01540517807006836, -0.014003753662109375, -0.01260232925415039, -0.011200904846191406, -0.009799480438232422, -0.008398056030273438, -0.006996631622314453, -0.005595207214355469, -0.004193782806396484, -0.0027923583984375, -0.0013909339904785156, 1.049041748046875e-05, 0.0014119148254394531, 0.0028133392333984375, 0.004214763641357422, 0.005616188049316406, 0.007017612457275391, 0.008419036865234375, 0.00982046127319336, 0.011221885681152344, 0.012623310089111328, 0.014024734497070312, 0.015426158905029297, 0.01682758331298828, 0.018229007720947266, 0.01963043212890625, 0.021031856536865234, 0.02243328094482422, 0.023834705352783203, 0.025236129760742188, 0.026637554168701172, 0.028038978576660156, 0.02944040298461914, 0.030841827392578125, 0.03224325180053711, 0.033644676208496094, 0.03504610061645508, 0.03644752502441406, 0.03784894943237305, 0.03925037384033203, 0.040651798248291016, 0.04205322265625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 10.0, 10.0, 9.0, 13.0, 34.0, 55.0, 55.0, 81.0, 98.0, 103.0, 127.0, 109.0, 100.0, 52.0, 44.0, 25.0, 27.0, 16.0, 4.0, 4.0, 9.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.230142593383789, -2.11362886428833, -1.9971152544021606, -1.8806015253067017, -1.7640879154205322, -1.6475741863250732, -1.5310604572296143, -1.4145468473434448, -1.2980332374572754, -1.1815195083618164, -1.065005898475647, -0.948492169380188, -0.8319785594940186, -0.7154648303985596, -0.5989511609077454, -0.48243749141693115, -0.36592376232147217, -0.24941009283065796, -0.13289640843868256, -0.016382724046707153, 0.10013094544410706, 0.21664464473724365, 0.33315831422805786, 0.44967198371887207, 0.5661856532096863, 0.6826993227005005, 0.7992129921913147, 0.9157266616821289, 1.032240390777588, 1.1487541198730469, 1.2652677297592163, 1.3817813396453857, 1.4982950687408447, 1.6148087978363037, 1.7313224077224731, 1.8478361368179321, 1.9643497467041016, 2.0808634757995605, 2.1973772048950195, 2.3138909339904785, 2.4304044246673584, 2.5469181537628174, 2.6634318828582764, 2.7799453735351562, 2.8964591026306152, 3.012972831726074, 3.129486560821533, 3.246000289916992, 3.362514019012451, 3.47902774810791, 3.595541477203369, 3.712054967880249, 3.828568696975708, 3.945082426071167, 4.061595916748047, 4.178109645843506, 4.294623374938965, 4.411137104034424, 4.527650833129883, 4.644164562225342, 4.760678291320801, 4.877191543579102, 4.9937052726745605, 5.1102190017700195, 5.2267327308654785]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 3.0, 5.0, 8.0, 6.0, 14.0, 16.0, 20.0, 21.0, 31.0, 32.0, 36.0, 58.0, 71.0, 60.0, 53.0, 62.0, 67.0, 59.0, 69.0, 47.0, 54.0, 42.0, 39.0, 36.0, 20.0, 13.0, 17.0, 12.0, 7.0, 7.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6596763134002686, -2.5811033248901367, -2.502530097961426, -2.423957109451294, -2.345384120941162, -2.266810894012451, -2.1882379055023193, -2.1096649169921875, -2.0310916900634766, -1.9525185823440552, -1.8739455938339233, -1.795372486114502, -1.7167994976043701, -1.6382263898849487, -1.5596532821655273, -1.4810802936553955, -1.4025073051452637, -1.3239341974258423, -1.2453612089157104, -1.166788101196289, -1.0882151126861572, -1.0096420049667358, -0.9310688972473145, -0.8524958491325378, -0.7739228010177612, -0.6953497529029846, -0.616776704788208, -0.5382035970687866, -0.45963054895401, -0.3810575008392334, -0.3024844229221344, -0.2239113450050354, -0.1453385353088379, -0.06676547229290009, 0.01180759072303772, 0.09038065373897552, 0.16895371675491333, 0.24752676486968994, 0.32609984278678894, 0.40467292070388794, 0.48324596881866455, 0.5618190169334412, 0.6403920650482178, 0.7189651727676392, 0.7975382208824158, 0.8761112689971924, 0.9546843767166138, 1.0332574844360352, 1.111830472946167, 1.1904035806655884, 1.2689765691757202, 1.3475496768951416, 1.4261226654052734, 1.5046957731246948, 1.5832688808441162, 1.661841869354248, 1.7404149770736694, 1.8189880847930908, 1.8975610733032227, 1.976134181022644, 2.0547072887420654, 2.1332802772521973, 2.211853265762329, 2.29042649269104, 2.368999481201172]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 5.0, 14.0, 15.0, 22.0, 28.0, 60.0, 86.0, 156.0, 285.0, 521.0, 1010.0, 1753.0, 3744.0, 8670.0, 27132.0, 151662.0, 699085.0, 116084.0, 23284.0, 7855.0, 3451.0, 1696.0, 837.0, 474.0, 240.0, 135.0, 88.0, 58.0, 30.0, 26.0, 11.0, 6.0, 11.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.7109375, -1.66265869140625, -1.6143798828125, -1.56610107421875, -1.517822265625, -1.46954345703125, -1.4212646484375, -1.37298583984375, -1.32470703125, -1.27642822265625, -1.2281494140625, -1.17987060546875, -1.131591796875, -1.08331298828125, -1.0350341796875, -0.98675537109375, -0.9384765625, -0.89019775390625, -0.8419189453125, -0.79364013671875, -0.745361328125, -0.69708251953125, -0.6488037109375, -0.60052490234375, -0.55224609375, -0.50396728515625, -0.4556884765625, -0.40740966796875, -0.359130859375, -0.31085205078125, -0.2625732421875, -0.21429443359375, -0.166015625, -0.11773681640625, -0.0694580078125, -0.02117919921875, 0.027099609375, 0.07537841796875, 0.1236572265625, 0.17193603515625, 0.22021484375, 0.26849365234375, 0.3167724609375, 0.36505126953125, 0.413330078125, 0.46160888671875, 0.5098876953125, 0.55816650390625, 0.6064453125, 0.65472412109375, 0.7030029296875, 0.75128173828125, 0.799560546875, 0.84783935546875, 0.8961181640625, 0.94439697265625, 0.99267578125, 1.04095458984375, 1.0892333984375, 1.13751220703125, 1.185791015625, 1.23406982421875, 1.2823486328125, 1.33062744140625, 1.37890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 7.0, 12.0, 11.0, 19.0, 21.0, 36.0, 26.0, 35.0, 33.0, 40.0, 54.0, 65.0, 62.0, 68.0, 53.0, 59.0, 67.0, 48.0, 50.0, 40.0, 39.0, 41.0, 26.0, 15.0, 17.0, 15.0, 8.0, 5.0, 4.0, 7.0, 1.0, 7.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.95703125, -5.7877197265625, -5.618408203125, -5.4490966796875, -5.27978515625, -5.1104736328125, -4.941162109375, -4.7718505859375, -4.6025390625, -4.4332275390625, -4.263916015625, -4.0946044921875, -3.92529296875, -3.7559814453125, -3.586669921875, -3.4173583984375, -3.248046875, -3.0787353515625, -2.909423828125, -2.7401123046875, -2.57080078125, -2.4014892578125, -2.232177734375, -2.0628662109375, -1.8935546875, -1.7242431640625, -1.554931640625, -1.3856201171875, -1.21630859375, -1.0469970703125, -0.877685546875, -0.7083740234375, -0.5390625, -0.3697509765625, -0.200439453125, -0.0311279296875, 0.13818359375, 0.3074951171875, 0.476806640625, 0.6461181640625, 0.8154296875, 0.9847412109375, 1.154052734375, 1.3233642578125, 1.49267578125, 1.6619873046875, 1.831298828125, 2.0006103515625, 2.169921875, 2.3392333984375, 2.508544921875, 2.6778564453125, 2.84716796875, 3.0164794921875, 3.185791015625, 3.3551025390625, 3.5244140625, 3.6937255859375, 3.863037109375, 4.0323486328125, 4.20166015625, 4.3709716796875, 4.540283203125, 4.7095947265625, 4.87890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 6.0, 8.0, 15.0, 18.0, 15.0, 19.0, 16.0, 22.0, 19.0, 33.0, 30.0, 37.0, 42.0, 46.0, 34.0, 90.0, 967.0, 1039687.0, 6839.0, 149.0, 45.0, 49.0, 36.0, 33.0, 26.0, 36.0, 30.0, 31.0, 28.0, 19.0, 15.0, 11.0, 18.0, 9.0, 8.0, 16.0, 9.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.875, -17.310791015625, -16.74658203125, -16.182373046875, -15.6181640625, -15.053955078125, -14.48974609375, -13.925537109375, -13.361328125, -12.797119140625, -12.23291015625, -11.668701171875, -11.1044921875, -10.540283203125, -9.97607421875, -9.411865234375, -8.84765625, -8.283447265625, -7.71923828125, -7.155029296875, -6.5908203125, -6.026611328125, -5.46240234375, -4.898193359375, -4.333984375, -3.769775390625, -3.20556640625, -2.641357421875, -2.0771484375, -1.512939453125, -0.94873046875, -0.384521484375, 0.1796875, 0.743896484375, 1.30810546875, 1.872314453125, 2.4365234375, 3.000732421875, 3.56494140625, 4.129150390625, 4.693359375, 5.257568359375, 5.82177734375, 6.385986328125, 6.9501953125, 7.514404296875, 8.07861328125, 8.642822265625, 9.20703125, 9.771240234375, 10.33544921875, 10.899658203125, 11.4638671875, 12.028076171875, 12.59228515625, 13.156494140625, 13.720703125, 14.284912109375, 14.84912109375, 15.413330078125, 15.9775390625, 16.541748046875, 17.10595703125, 17.670166015625, 18.234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 9.0, 8.0, 6.0, 6.0, 14.0, 15.0, 20.0, 23.0, 15.0, 23.0, 24.0, 28.0, 39.0, 36.0, 46.0, 38.0, 42.0, 40.0, 53.0, 36.0, 40.0, 44.0, 43.0, 45.0, 33.0, 27.0, 34.0, 30.0, 38.0, 22.0, 20.0, 14.0, 13.0, 13.0, 13.0, 12.0, 11.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.515625, -4.38262939453125, -4.2496337890625, -4.11663818359375, -3.983642578125, -3.85064697265625, -3.7176513671875, -3.58465576171875, -3.45166015625, -3.31866455078125, -3.1856689453125, -3.05267333984375, -2.919677734375, -2.78668212890625, -2.6536865234375, -2.52069091796875, -2.3876953125, -2.25469970703125, -2.1217041015625, -1.98870849609375, -1.855712890625, -1.72271728515625, -1.5897216796875, -1.45672607421875, -1.32373046875, -1.19073486328125, -1.0577392578125, -0.92474365234375, -0.791748046875, -0.65875244140625, -0.5257568359375, -0.39276123046875, -0.259765625, -0.12677001953125, 0.0062255859375, 0.13922119140625, 0.272216796875, 0.40521240234375, 0.5382080078125, 0.67120361328125, 0.80419921875, 0.93719482421875, 1.0701904296875, 1.20318603515625, 1.336181640625, 1.46917724609375, 1.6021728515625, 1.73516845703125, 1.8681640625, 2.00115966796875, 2.1341552734375, 2.26715087890625, 2.400146484375, 2.53314208984375, 2.6661376953125, 2.79913330078125, 2.93212890625, 3.06512451171875, 3.1981201171875, 3.33111572265625, 3.464111328125, 3.59710693359375, 3.7301025390625, 3.86309814453125, 3.99609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 12.0, 21.0, 28.0, 33.0, 53.0, 76.0, 138.0, 312.0, 749.0, 2866.0, 14531.0, 157909.0, 820575.0, 42611.0, 6207.0, 1441.0, 491.0, 192.0, 110.0, 53.0, 35.0, 19.0, 18.0, 16.0, 7.0, 13.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.9658203125, -0.9405746459960938, -0.9153289794921875, -0.8900833129882812, -0.864837646484375, -0.8395919799804688, -0.8143463134765625, -0.7891006469726562, -0.76385498046875, -0.7386093139648438, -0.7133636474609375, -0.6881179809570312, -0.662872314453125, -0.6376266479492188, -0.6123809814453125, -0.5871353149414062, -0.5618896484375, -0.5366439819335938, -0.5113983154296875, -0.48615264892578125, -0.460906982421875, -0.43566131591796875, -0.4104156494140625, -0.38516998291015625, -0.35992431640625, -0.33467864990234375, -0.3094329833984375, -0.28418731689453125, -0.258941650390625, -0.23369598388671875, -0.2084503173828125, -0.18320465087890625, -0.157958984375, -0.13271331787109375, -0.1074676513671875, -0.08222198486328125, -0.056976318359375, -0.03173065185546875, -0.0064849853515625, 0.01876068115234375, 0.04400634765625, 0.06925201416015625, 0.0944976806640625, 0.11974334716796875, 0.144989013671875, 0.17023468017578125, 0.1954803466796875, 0.22072601318359375, 0.2459716796875, 0.27121734619140625, 0.2964630126953125, 0.32170867919921875, 0.346954345703125, 0.37220001220703125, 0.3974456787109375, 0.42269134521484375, 0.44793701171875, 0.47318267822265625, 0.4984283447265625, 0.5236740112304688, 0.548919677734375, 0.5741653442382812, 0.5994110107421875, 0.6246566772460938, 0.64990234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 12.0, 15.0, 11.0, 24.0, 36.0, 51.0, 86.0, 130.0, 164.0, 122.0, 107.0, 47.0, 32.0, 22.0, 22.0, 18.0, 16.0, 9.0, 3.0, 9.0, 6.0, 6.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.985664367675781e-05, -6.778072565793991e-05, -6.570480763912201e-05, -6.362888962030411e-05, -6.15529716014862e-05, -5.9477053582668304e-05, -5.74011355638504e-05, -5.53252175450325e-05, -5.32492995262146e-05, -5.11733815073967e-05, -4.9097463488578796e-05, -4.7021545469760895e-05, -4.494562745094299e-05, -4.286970943212509e-05, -4.079379141330719e-05, -3.871787339448929e-05, -3.664195537567139e-05, -3.4566037356853485e-05, -3.2490119338035583e-05, -3.0414201319217682e-05, -2.833828330039978e-05, -2.626236528158188e-05, -2.4186447262763977e-05, -2.2110529243946075e-05, -2.0034611225128174e-05, -1.7958693206310272e-05, -1.588277518749237e-05, -1.3806857168674469e-05, -1.1730939149856567e-05, -9.655021131038666e-06, -7.579103112220764e-06, -5.5031850934028625e-06, -3.427267074584961e-06, -1.3513490557670593e-06, 7.245689630508423e-07, 2.800486981868744e-06, 4.8764050006866455e-06, 6.952323019504547e-06, 9.028241038322449e-06, 1.110415905714035e-05, 1.3180077075958252e-05, 1.5255995094776154e-05, 1.7331913113594055e-05, 1.9407831132411957e-05, 2.148374915122986e-05, 2.355966717004776e-05, 2.563558518886566e-05, 2.7711503207683563e-05, 2.9787421226501465e-05, 3.1863339245319366e-05, 3.393925726413727e-05, 3.601517528295517e-05, 3.809109330177307e-05, 4.016701132059097e-05, 4.2242929339408875e-05, 4.4318847358226776e-05, 4.639476537704468e-05, 4.847068339586258e-05, 5.054660141468048e-05, 5.262251943349838e-05, 5.4698437452316284e-05, 5.6774355471134186e-05, 5.885027348995209e-05, 6.092619150876999e-05, 6.300210952758789e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 8.0, 9.0, 13.0, 19.0, 28.0, 35.0, 69.0, 107.0, 204.0, 446.0, 1024.0, 2831.0, 8911.0, 43163.0, 665999.0, 287035.0, 28238.0, 6546.0, 2168.0, 867.0, 377.0, 183.0, 102.0, 53.0, 26.0, 22.0, 11.0, 10.0, 11.0, 6.0, 8.0, 0.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6523895263671875, -0.631927490234375, -0.6114654541015625, -0.59100341796875, -0.5705413818359375, -0.550079345703125, -0.5296173095703125, -0.5091552734375, -0.4886932373046875, -0.468231201171875, -0.4477691650390625, -0.42730712890625, -0.4068450927734375, -0.386383056640625, -0.3659210205078125, -0.345458984375, -0.3249969482421875, -0.304534912109375, -0.2840728759765625, -0.26361083984375, -0.2431488037109375, -0.222686767578125, -0.2022247314453125, -0.1817626953125, -0.1613006591796875, -0.140838623046875, -0.1203765869140625, -0.09991455078125, -0.0794525146484375, -0.058990478515625, -0.0385284423828125, -0.01806640625, 0.0023956298828125, 0.022857666015625, 0.0433197021484375, 0.06378173828125, 0.0842437744140625, 0.104705810546875, 0.1251678466796875, 0.1456298828125, 0.1660919189453125, 0.186553955078125, 0.2070159912109375, 0.22747802734375, 0.2479400634765625, 0.268402099609375, 0.2888641357421875, 0.309326171875, 0.3297882080078125, 0.350250244140625, 0.3707122802734375, 0.39117431640625, 0.4116363525390625, 0.432098388671875, 0.4525604248046875, 0.4730224609375, 0.4934844970703125, 0.513946533203125, 0.5344085693359375, 0.55487060546875, 0.5753326416015625, 0.595794677734375, 0.6162567138671875, 0.63671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 0.0, 7.0, 8.0, 16.0, 14.0, 20.0, 22.0, 34.0, 38.0, 62.0, 84.0, 139.0, 180.0, 99.0, 80.0, 60.0, 33.0, 23.0, 14.0, 16.0, 11.0, 4.0, 7.0, 4.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1904296875, -0.18390464782714844, -0.17737960815429688, -0.1708545684814453, -0.16432952880859375, -0.1578044891357422, -0.15127944946289062, -0.14475440979003906, -0.1382293701171875, -0.13170433044433594, -0.12517929077148438, -0.11865425109863281, -0.11212921142578125, -0.10560417175292969, -0.09907913208007812, -0.09255409240722656, -0.086029052734375, -0.07950401306152344, -0.07297897338867188, -0.06645393371582031, -0.05992889404296875, -0.05340385437011719, -0.046878814697265625, -0.04035377502441406, -0.0338287353515625, -0.027303695678710938, -0.020778656005859375, -0.014253616333007812, -0.00772857666015625, -0.0012035369873046875, 0.005321502685546875, 0.011846542358398438, 0.01837158203125, 0.024896621704101562, 0.031421661376953125, 0.03794670104980469, 0.04447174072265625, 0.05099678039550781, 0.057521820068359375, 0.06404685974121094, 0.0705718994140625, 0.07709693908691406, 0.08362197875976562, 0.09014701843261719, 0.09667205810546875, 0.10319709777832031, 0.10972213745117188, 0.11624717712402344, 0.122772216796875, 0.12929725646972656, 0.13582229614257812, 0.1423473358154297, 0.14887237548828125, 0.1553974151611328, 0.16192245483398438, 0.16844749450683594, 0.1749725341796875, 0.18149757385253906, 0.18802261352539062, 0.1945476531982422, 0.20107269287109375, 0.2075977325439453, 0.21412277221679688, 0.22064781188964844, 0.2271728515625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 6.0, 7.0, 14.0, 18.0, 40.0, 66.0, 98.0, 129.0, 153.0, 143.0, 131.0, 77.0, 40.0, 45.0, 15.0, 7.0, 5.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5602850914001465, -4.252932071685791, -3.9455790519714355, -3.63822603225708, -3.3308730125427246, -3.023519992828369, -2.7161669731140137, -2.408813953399658, -2.1014609336853027, -1.7941079139709473, -1.4867548942565918, -1.1794018745422363, -0.8720488548278809, -0.5646958351135254, -0.2573428153991699, 0.05001020431518555, 0.357363224029541, 0.6647162437438965, 0.972069263458252, 1.2794222831726074, 1.586775302886963, 1.8941283226013184, 2.201481342315674, 2.5088343620300293, 2.8161873817443848, 3.1235404014587402, 3.4308934211730957, 3.738246440887451, 4.045599460601807, 4.352952480316162, 4.660305500030518, 4.967658519744873, 5.27501106262207, 5.582364082336426, 5.889717102050781, 6.197070121765137, 6.504423141479492, 6.811776161193848, 7.119129180908203, 7.426482200622559, 7.733835220336914, 8.04118824005127, 8.348541259765625, 8.65589427947998, 8.963247299194336, 9.270600318908691, 9.577953338623047, 9.885306358337402, 10.192659378051758, 10.500012397766113, 10.807365417480469, 11.114718437194824, 11.42207145690918, 11.729424476623535, 12.03677749633789, 12.344130516052246, 12.651483535766602, 12.958836555480957, 13.266189575195312, 13.573542594909668, 13.880895614624023, 14.188248634338379, 14.495601654052734, 14.80295467376709, 15.110307693481445]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 1.0, 8.0, 7.0, 13.0, 15.0, 8.0, 13.0, 20.0, 20.0, 26.0, 29.0, 21.0, 40.0, 41.0, 57.0, 38.0, 50.0, 50.0, 58.0, 42.0, 43.0, 42.0, 56.0, 44.0, 50.0, 31.0, 34.0, 25.0, 17.0, 22.0, 18.0, 13.0, 16.0, 9.0, 9.0, 0.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.838198184967041, -7.618335723876953, -7.398473262786865, -7.178610801696777, -6.958748817443848, -6.73888635635376, -6.519023895263672, -6.299161434173584, -6.079298973083496, -5.859436511993408, -5.63957405090332, -5.419712066650391, -5.199849605560303, -4.979987144470215, -4.760124683380127, -4.540262222290039, -4.320400238037109, -4.1005377769470215, -3.8806755542755127, -3.660813093185425, -3.440950870513916, -3.221088409423828, -3.0012259483337402, -2.7813634872436523, -2.5615012645721436, -2.3416388034820557, -2.121776580810547, -1.901914119720459, -1.6820517778396606, -1.4621894359588623, -1.2423269748687744, -1.022464632987976, -0.8026022911071777, -0.5827399492263794, -0.3628775477409363, -0.14301514625549316, 0.07684719562530518, 0.2967095375061035, 0.5165719985961914, 0.7364343404769897, 0.9562966823577881, 1.1761590242385864, 1.3960213661193848, 1.6158838272094727, 1.835746169090271, 2.0556085109710693, 2.2754709720611572, 2.495333194732666, 2.715195655822754, 2.935058116912842, 3.1549203395843506, 3.3747828006744385, 3.5946450233459473, 3.814507484436035, 4.034369945526123, 4.254232406616211, 4.474094390869141, 4.6939568519592285, 4.913819313049316, 5.133681297302246, 5.353543758392334, 5.573406219482422, 5.79326868057251, 6.013131141662598, 6.2329936027526855]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 8.0, 6.0, 11.0, 22.0, 33.0, 57.0, 47.0, 90.0, 166.0, 289.0, 517.0, 903.0, 1690.0, 3439.0, 8099.0, 21770.0, 71741.0, 324001.0, 1357085.0, 1761382.0, 487000.0, 104612.0, 30140.0, 11475.0, 4950.0, 2212.0, 1030.0, 598.0, 356.0, 218.0, 126.0, 70.0, 39.0, 34.0, 24.0, 9.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.576171875, -3.474395751953125, -3.37261962890625, -3.270843505859375, -3.1690673828125, -3.067291259765625, -2.96551513671875, -2.863739013671875, -2.761962890625, -2.660186767578125, -2.55841064453125, -2.456634521484375, -2.3548583984375, -2.253082275390625, -2.15130615234375, -2.049530029296875, -1.94775390625, -1.845977783203125, -1.74420166015625, -1.642425537109375, -1.5406494140625, -1.438873291015625, -1.33709716796875, -1.235321044921875, -1.133544921875, -1.031768798828125, -0.92999267578125, -0.828216552734375, -0.7264404296875, -0.624664306640625, -0.52288818359375, -0.421112060546875, -0.3193359375, -0.217559814453125, -0.11578369140625, -0.014007568359375, 0.0877685546875, 0.189544677734375, 0.29132080078125, 0.393096923828125, 0.494873046875, 0.596649169921875, 0.69842529296875, 0.800201416015625, 0.9019775390625, 1.003753662109375, 1.10552978515625, 1.207305908203125, 1.30908203125, 1.410858154296875, 1.51263427734375, 1.614410400390625, 1.7161865234375, 1.817962646484375, 1.91973876953125, 2.021514892578125, 2.123291015625, 2.225067138671875, 2.32684326171875, 2.428619384765625, 2.5303955078125, 2.632171630859375, 2.73394775390625, 2.835723876953125, 2.9375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 7.0, 4.0, 13.0, 18.0, 19.0, 18.0, 33.0, 36.0, 48.0, 50.0, 73.0, 70.0, 76.0, 57.0, 74.0, 71.0, 50.0, 53.0, 57.0, 38.0, 39.0, 25.0, 18.0, 14.0, 9.0, 12.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.1077880859375, -3.985107421875, -3.8624267578125, -3.73974609375, -3.6170654296875, -3.494384765625, -3.3717041015625, -3.2490234375, -3.1263427734375, -3.003662109375, -2.8809814453125, -2.75830078125, -2.6356201171875, -2.512939453125, -2.3902587890625, -2.267578125, -2.1448974609375, -2.022216796875, -1.8995361328125, -1.77685546875, -1.6541748046875, -1.531494140625, -1.4088134765625, -1.2861328125, -1.1634521484375, -1.040771484375, -0.9180908203125, -0.79541015625, -0.6727294921875, -0.550048828125, -0.4273681640625, -0.3046875, -0.1820068359375, -0.059326171875, 0.0633544921875, 0.18603515625, 0.3087158203125, 0.431396484375, 0.5540771484375, 0.6767578125, 0.7994384765625, 0.922119140625, 1.0447998046875, 1.16748046875, 1.2901611328125, 1.412841796875, 1.5355224609375, 1.658203125, 1.7808837890625, 1.903564453125, 2.0262451171875, 2.14892578125, 2.2716064453125, 2.394287109375, 2.5169677734375, 2.6396484375, 2.7623291015625, 2.885009765625, 3.0076904296875, 3.13037109375, 3.2530517578125, 3.375732421875, 3.4984130859375, 3.62109375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 11.0, 8.0, 17.0, 44.0, 60.0, 98.0, 268.0, 813.0, 5135.0, 180223.0, 3969487.0, 34776.0, 2359.0, 517.0, 218.0, 102.0, 50.0, 42.0, 26.0, 12.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4140625, -7.0491943359375, -6.684326171875, -6.3194580078125, -5.95458984375, -5.5897216796875, -5.224853515625, -4.8599853515625, -4.4951171875, -4.1302490234375, -3.765380859375, -3.4005126953125, -3.03564453125, -2.6707763671875, -2.305908203125, -1.9410400390625, -1.576171875, -1.2113037109375, -0.846435546875, -0.4815673828125, -0.11669921875, 0.2481689453125, 0.613037109375, 0.9779052734375, 1.3427734375, 1.7076416015625, 2.072509765625, 2.4373779296875, 2.80224609375, 3.1671142578125, 3.531982421875, 3.8968505859375, 4.26171875, 4.6265869140625, 4.991455078125, 5.3563232421875, 5.72119140625, 6.0860595703125, 6.450927734375, 6.8157958984375, 7.1806640625, 7.5455322265625, 7.910400390625, 8.2752685546875, 8.64013671875, 9.0050048828125, 9.369873046875, 9.7347412109375, 10.099609375, 10.4644775390625, 10.829345703125, 11.1942138671875, 11.55908203125, 11.9239501953125, 12.288818359375, 12.6536865234375, 13.0185546875, 13.3834228515625, 13.748291015625, 14.1131591796875, 14.47802734375, 14.8428955078125, 15.207763671875, 15.5726318359375, 15.9375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 8.0, 13.0, 31.0, 59.0, 78.0, 169.0, 298.0, 693.0, 991.0, 821.0, 439.0, 206.0, 107.0, 60.0, 32.0, 25.0, 10.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.900390625, -2.8324432373046875, -2.764495849609375, -2.6965484619140625, -2.62860107421875, -2.5606536865234375, -2.492706298828125, -2.4247589111328125, -2.3568115234375, -2.2888641357421875, -2.220916748046875, -2.1529693603515625, -2.08502197265625, -2.0170745849609375, -1.949127197265625, -1.8811798095703125, -1.813232421875, -1.7452850341796875, -1.677337646484375, -1.6093902587890625, -1.54144287109375, -1.4734954833984375, -1.405548095703125, -1.3376007080078125, -1.2696533203125, -1.2017059326171875, -1.133758544921875, -1.0658111572265625, -0.99786376953125, -0.9299163818359375, -0.861968994140625, -0.7940216064453125, -0.72607421875, -0.6581268310546875, -0.590179443359375, -0.5222320556640625, -0.45428466796875, -0.3863372802734375, -0.318389892578125, -0.2504425048828125, -0.1824951171875, -0.1145477294921875, -0.046600341796875, 0.0213470458984375, 0.08929443359375, 0.1572418212890625, 0.225189208984375, 0.2931365966796875, 0.361083984375, 0.4290313720703125, 0.496978759765625, 0.5649261474609375, 0.63287353515625, 0.7008209228515625, 0.768768310546875, 0.8367156982421875, 0.9046630859375, 0.9726104736328125, 1.040557861328125, 1.1085052490234375, 1.17645263671875, 1.2444000244140625, 1.312347412109375, 1.3802947998046875, 1.4482421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 7.0, 8.0, 31.0, 41.0, 66.0, 93.0, 142.0, 135.0, 163.0, 114.0, 81.0, 50.0, 29.0, 20.0, 7.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.182204246520996, -3.919768810272217, -3.6573333740234375, -3.3948981761932373, -3.132462739944458, -2.8700273036956787, -2.6075921058654785, -2.345156669616699, -2.08272123336792, -1.8202857971191406, -1.5578504800796509, -1.2954151630401611, -1.0329797267913818, -0.7705442905426025, -0.5081089735031128, -0.24567365646362305, 0.01676177978515625, 0.27919715642929077, 0.5416325330734253, 0.8040679097175598, 1.0665032863616943, 1.3289387226104736, 1.5913740396499634, 1.8538093566894531, 2.1162447929382324, 2.3786802291870117, 2.641115665435791, 2.903550863265991, 3.1659862995147705, 3.42842173576355, 3.69085693359375, 3.9532923698425293, 4.215728759765625, 4.478164196014404, 4.740599632263184, 5.003035068511963, 5.265470504760742, 5.527905464172363, 5.790340900421143, 6.052776336669922, 6.315211772918701, 6.5776472091674805, 6.84008264541626, 7.102518081665039, 7.36495304107666, 7.627388954162598, 7.889823913574219, 8.152259826660156, 8.414694786071777, 8.677129745483398, 8.939565658569336, 9.202000617980957, 9.464436531066895, 9.726871490478516, 9.989307403564453, 10.251742362976074, 10.514177322387695, 10.776612281799316, 11.039048194885254, 11.301483154296875, 11.563919067382812, 11.826354026794434, 12.088789939880371, 12.351224899291992, 12.61366081237793]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 6.0, 8.0, 6.0, 11.0, 13.0, 22.0, 27.0, 28.0, 29.0, 32.0, 34.0, 59.0, 59.0, 45.0, 55.0, 49.0, 60.0, 71.0, 58.0, 68.0, 37.0, 40.0, 47.0, 32.0, 28.0, 20.0, 14.0, 9.0, 10.0, 8.0, 5.0, 4.0, 3.0, 0.0, 7.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.250951766967773, -4.130521774291992, -4.010091304779053, -3.8896613121032715, -3.769231081008911, -3.648800849914551, -3.5283708572387695, -3.407940626144409, -3.287510395050049, -3.1670801639556885, -3.046649932861328, -2.926219940185547, -2.8057897090911865, -2.685359477996826, -2.564929485321045, -2.4444992542266846, -2.324069023132324, -2.203638792037964, -2.0832085609436035, -1.9627785682678223, -1.842348337173462, -1.7219181060791016, -1.6014879941940308, -1.48105788230896, -1.3606276512145996, -1.2401974201202393, -1.1197673082351685, -0.9993371367454529, -0.8789069652557373, -0.7584767937660217, -0.6380466222763062, -0.5176164507865906, -0.3971865177154541, -0.2767563462257385, -0.15632617473602295, -0.03589600324630737, 0.0845341682434082, 0.20496433973312378, 0.32539451122283936, 0.44582468271255493, 0.5662548542022705, 0.6866850256919861, 0.8071151971817017, 0.9275453686714172, 1.0479755401611328, 1.1684057712554932, 1.288835883140564, 1.4092659950256348, 1.5296962261199951, 1.6501264572143555, 1.7705565690994263, 1.890986680984497, 2.0114169120788574, 2.1318471431732178, 2.252277374267578, 2.3727073669433594, 2.4931375980377197, 2.61356782913208, 2.7339978218078613, 2.8544280529022217, 2.974858283996582, 3.0952885150909424, 3.2157187461853027, 3.336148738861084, 3.4565789699554443]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 19.0, 24.0, 45.0, 46.0, 69.0, 139.0, 200.0, 365.0, 724.0, 1610.0, 4095.0, 15817.0, 164852.0, 786903.0, 59422.0, 8836.0, 2757.0, 1214.0, 605.0, 310.0, 183.0, 92.0, 56.0, 42.0, 29.0, 17.0, 13.0, 15.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.1595306396484375, -1.124725341796875, -1.0899200439453125, -1.05511474609375, -1.0203094482421875, -0.985504150390625, -0.9506988525390625, -0.9158935546875, -0.8810882568359375, -0.846282958984375, -0.8114776611328125, -0.77667236328125, -0.7418670654296875, -0.707061767578125, -0.6722564697265625, -0.637451171875, -0.6026458740234375, -0.567840576171875, -0.5330352783203125, -0.49822998046875, -0.4634246826171875, -0.428619384765625, -0.3938140869140625, -0.3590087890625, -0.3242034912109375, -0.289398193359375, -0.2545928955078125, -0.21978759765625, -0.1849822998046875, -0.150177001953125, -0.1153717041015625, -0.08056640625, -0.0457611083984375, -0.010955810546875, 0.0238494873046875, 0.05865478515625, 0.0934600830078125, 0.128265380859375, 0.1630706787109375, 0.1978759765625, 0.2326812744140625, 0.267486572265625, 0.3022918701171875, 0.33709716796875, 0.3719024658203125, 0.406707763671875, 0.4415130615234375, 0.476318359375, 0.5111236572265625, 0.545928955078125, 0.5807342529296875, 0.61553955078125, 0.6503448486328125, 0.685150146484375, 0.7199554443359375, 0.7547607421875, 0.7895660400390625, 0.824371337890625, 0.8591766357421875, 0.89398193359375, 0.9287872314453125, 0.963592529296875, 0.9983978271484375, 1.033203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 6.0, 11.0, 21.0, 17.0, 37.0, 40.0, 46.0, 50.0, 57.0, 72.0, 64.0, 83.0, 57.0, 72.0, 78.0, 56.0, 44.0, 49.0, 41.0, 20.0, 19.0, 14.0, 11.0, 4.0, 10.0, 6.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.782257080078125, -2.69732666015625, -2.612396240234375, -2.5274658203125, -2.442535400390625, -2.35760498046875, -2.272674560546875, -2.187744140625, -2.102813720703125, -2.01788330078125, -1.932952880859375, -1.8480224609375, -1.763092041015625, -1.67816162109375, -1.593231201171875, -1.50830078125, -1.423370361328125, -1.33843994140625, -1.253509521484375, -1.1685791015625, -1.083648681640625, -0.99871826171875, -0.913787841796875, -0.828857421875, -0.743927001953125, -0.65899658203125, -0.574066162109375, -0.4891357421875, -0.404205322265625, -0.31927490234375, -0.234344482421875, -0.1494140625, -0.064483642578125, 0.02044677734375, 0.105377197265625, 0.1903076171875, 0.275238037109375, 0.36016845703125, 0.445098876953125, 0.530029296875, 0.614959716796875, 0.69989013671875, 0.784820556640625, 0.8697509765625, 0.954681396484375, 1.03961181640625, 1.124542236328125, 1.20947265625, 1.294403076171875, 1.37933349609375, 1.464263916015625, 1.5491943359375, 1.634124755859375, 1.71905517578125, 1.803985595703125, 1.888916015625, 1.973846435546875, 2.05877685546875, 2.143707275390625, 2.2286376953125, 2.313568115234375, 2.39849853515625, 2.483428955078125, 2.568359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 6.0, 11.0, 10.0, 20.0, 25.0, 25.0, 46.0, 62.0, 107.0, 140.0, 230.0, 352.0, 520.0, 782.0, 1256.0, 2029.0, 3254.0, 5531.0, 9449.0, 16968.0, 32062.0, 66343.0, 157898.0, 339935.0, 227086.0, 91595.0, 41917.0, 21654.0, 11865.0, 6678.0, 3923.0, 2478.0, 1513.0, 934.0, 599.0, 373.0, 290.0, 181.0, 127.0, 92.0, 46.0, 48.0, 29.0, 14.0, 16.0, 11.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.1895751953125, -0.18359375, -0.1776123046875, -0.171630859375, -0.1656494140625, -0.15966796875, -0.1536865234375, -0.147705078125, -0.1417236328125, -0.1357421875, -0.1297607421875, -0.123779296875, -0.1177978515625, -0.11181640625, -0.1058349609375, -0.099853515625, -0.0938720703125, -0.087890625, -0.0819091796875, -0.075927734375, -0.0699462890625, -0.06396484375, -0.0579833984375, -0.052001953125, -0.0460205078125, -0.0400390625, -0.0340576171875, -0.028076171875, -0.0220947265625, -0.01611328125, -0.0101318359375, -0.004150390625, 0.0018310546875, 0.0078125, 0.0137939453125, 0.019775390625, 0.0257568359375, 0.03173828125, 0.0377197265625, 0.043701171875, 0.0496826171875, 0.0556640625, 0.0616455078125, 0.067626953125, 0.0736083984375, 0.07958984375, 0.0855712890625, 0.091552734375, 0.0975341796875, 0.103515625, 0.1094970703125, 0.115478515625, 0.1214599609375, 0.12744140625, 0.1334228515625, 0.139404296875, 0.1453857421875, 0.1513671875, 0.1573486328125, 0.163330078125, 0.1693115234375, 0.17529296875, 0.1812744140625, 0.187255859375, 0.1932373046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 2.0, 3.0, 10.0, 6.0, 8.0, 13.0, 13.0, 14.0, 24.0, 26.0, 30.0, 38.0, 43.0, 44.0, 49.0, 58.0, 53.0, 65.0, 63.0, 35.0, 67.0, 55.0, 44.0, 31.0, 33.0, 28.0, 27.0, 24.0, 17.0, 17.0, 14.0, 11.0, 7.0, 5.0, 5.0, 8.0, 2.0, 2.0, 10.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.328125, -4.20562744140625, -4.0831298828125, -3.96063232421875, -3.838134765625, -3.71563720703125, -3.5931396484375, -3.47064208984375, -3.34814453125, -3.22564697265625, -3.1031494140625, -2.98065185546875, -2.858154296875, -2.73565673828125, -2.6131591796875, -2.49066162109375, -2.3681640625, -2.24566650390625, -2.1231689453125, -2.00067138671875, -1.878173828125, -1.75567626953125, -1.6331787109375, -1.51068115234375, -1.38818359375, -1.26568603515625, -1.1431884765625, -1.02069091796875, -0.898193359375, -0.77569580078125, -0.6531982421875, -0.53070068359375, -0.408203125, -0.28570556640625, -0.1632080078125, -0.04071044921875, 0.081787109375, 0.20428466796875, 0.3267822265625, 0.44927978515625, 0.57177734375, 0.69427490234375, 0.8167724609375, 0.93927001953125, 1.061767578125, 1.18426513671875, 1.3067626953125, 1.42926025390625, 1.5517578125, 1.67425537109375, 1.7967529296875, 1.91925048828125, 2.041748046875, 2.16424560546875, 2.2867431640625, 2.40924072265625, 2.53173828125, 2.65423583984375, 2.7767333984375, 2.89923095703125, 3.021728515625, 3.14422607421875, 3.2667236328125, 3.38922119140625, 3.51171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 9.0, 9.0, 7.0, 15.0, 17.0, 30.0, 43.0, 74.0, 111.0, 183.0, 289.0, 549.0, 1102.0, 2439.0, 6856.0, 27410.0, 234815.0, 699455.0, 56374.0, 11724.0, 3777.0, 1591.0, 743.0, 393.0, 228.0, 135.0, 55.0, 35.0, 18.0, 23.0, 12.0, 7.0, 3.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.07318115234375, -0.07104206085205078, -0.06890296936035156, -0.06676387786865234, -0.06462478637695312, -0.062485694885253906, -0.06034660339355469, -0.05820751190185547, -0.05606842041015625, -0.05392932891845703, -0.05179023742675781, -0.049651145935058594, -0.047512054443359375, -0.045372962951660156, -0.04323387145996094, -0.04109477996826172, -0.0389556884765625, -0.03681659698486328, -0.03467750549316406, -0.032538414001464844, -0.030399322509765625, -0.028260231018066406, -0.026121139526367188, -0.02398204803466797, -0.02184295654296875, -0.01970386505126953, -0.017564773559570312, -0.015425682067871094, -0.013286590576171875, -0.011147499084472656, -0.009008407592773438, -0.006869316101074219, -0.004730224609375, -0.0025911331176757812, -0.0004520416259765625, 0.0016870498657226562, 0.003826141357421875, 0.005965232849121094, 0.008104324340820312, 0.010243415832519531, 0.01238250732421875, 0.014521598815917969, 0.016660690307617188, 0.018799781799316406, 0.020938873291015625, 0.023077964782714844, 0.025217056274414062, 0.02735614776611328, 0.0294952392578125, 0.03163433074951172, 0.03377342224121094, 0.035912513732910156, 0.038051605224609375, 0.040190696716308594, 0.04232978820800781, 0.04446887969970703, 0.04660797119140625, 0.04874706268310547, 0.05088615417480469, 0.053025245666503906, 0.055164337158203125, 0.057303428649902344, 0.05944252014160156, 0.06158161163330078, 0.063720703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 7.0, 14.0, 18.0, 24.0, 20.0, 31.0, 40.0, 51.0, 74.0, 84.0, 104.0, 110.0, 97.0, 72.0, 59.0, 48.0, 36.0, 29.0, 14.0, 10.0, 13.0, 14.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.647804260253906e-05, -3.5305507481098175e-05, -3.413297235965729e-05, -3.29604372382164e-05, -3.178790211677551e-05, -3.0615366995334625e-05, -2.9442831873893738e-05, -2.827029675245285e-05, -2.7097761631011963e-05, -2.5925226509571075e-05, -2.4752691388130188e-05, -2.35801562666893e-05, -2.2407621145248413e-05, -2.1235086023807526e-05, -2.0062550902366638e-05, -1.889001578092575e-05, -1.7717480659484863e-05, -1.6544945538043976e-05, -1.537241041660309e-05, -1.4199875295162201e-05, -1.3027340173721313e-05, -1.1854805052280426e-05, -1.0682269930839539e-05, -9.509734809398651e-06, -8.337199687957764e-06, -7.164664566516876e-06, -5.992129445075989e-06, -4.819594323635101e-06, -3.647059202194214e-06, -2.4745240807533264e-06, -1.301988959312439e-06, -1.2945383787155151e-07, 1.043081283569336e-06, 2.2156164050102234e-06, 3.388151526451111e-06, 4.560686647891998e-06, 5.733221769332886e-06, 6.905756890773773e-06, 8.07829201221466e-06, 9.250827133655548e-06, 1.0423362255096436e-05, 1.1595897376537323e-05, 1.276843249797821e-05, 1.3940967619419098e-05, 1.5113502740859985e-05, 1.6286037862300873e-05, 1.745857298374176e-05, 1.8631108105182648e-05, 1.9803643226623535e-05, 2.0976178348064423e-05, 2.214871346950531e-05, 2.3321248590946198e-05, 2.4493783712387085e-05, 2.5666318833827972e-05, 2.683885395526886e-05, 2.8011389076709747e-05, 2.9183924198150635e-05, 3.0356459319591522e-05, 3.152899444103241e-05, 3.27015295624733e-05, 3.3874064683914185e-05, 3.504659980535507e-05, 3.621913492679596e-05, 3.739167004823685e-05, 3.8564205169677734e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 8.0, 5.0, 5.0, 16.0, 8.0, 16.0, 28.0, 54.0, 72.0, 144.0, 364.0, 1182.0, 4816.0, 29794.0, 605331.0, 377292.0, 23588.0, 4114.0, 1011.0, 357.0, 114.0, 75.0, 47.0, 42.0, 17.0, 13.0, 7.0, 4.0, 3.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10906982421875, -0.10565567016601562, -0.10224151611328125, -0.09882736206054688, -0.0954132080078125, -0.09199905395507812, -0.08858489990234375, -0.08517074584960938, -0.081756591796875, -0.07834243774414062, -0.07492828369140625, -0.07151412963867188, -0.0680999755859375, -0.06468582153320312, -0.06127166748046875, -0.057857513427734375, -0.054443359375, -0.051029205322265625, -0.04761505126953125, -0.044200897216796875, -0.0407867431640625, -0.037372589111328125, -0.03395843505859375, -0.030544281005859375, -0.027130126953125, -0.023715972900390625, -0.02030181884765625, -0.016887664794921875, -0.0134735107421875, -0.010059356689453125, -0.00664520263671875, -0.003231048583984375, 0.00018310546875, 0.003597259521484375, 0.00701141357421875, 0.010425567626953125, 0.0138397216796875, 0.017253875732421875, 0.02066802978515625, 0.024082183837890625, 0.027496337890625, 0.030910491943359375, 0.03432464599609375, 0.037738800048828125, 0.0411529541015625, 0.044567108154296875, 0.04798126220703125, 0.051395416259765625, 0.0548095703125, 0.058223724365234375, 0.06163787841796875, 0.06505203247070312, 0.0684661865234375, 0.07188034057617188, 0.07529449462890625, 0.07870864868164062, 0.082122802734375, 0.08553695678710938, 0.08895111083984375, 0.09236526489257812, 0.0957794189453125, 0.09919357299804688, 0.10260772705078125, 0.10602188110351562, 0.10943603515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 7.0, 6.0, 12.0, 14.0, 10.0, 17.0, 23.0, 35.0, 66.0, 70.0, 119.0, 163.0, 142.0, 90.0, 59.0, 32.0, 38.0, 25.0, 13.0, 10.0, 14.0, 12.0, 2.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020263671875, -0.019725918769836426, -0.01918816566467285, -0.018650412559509277, -0.018112659454345703, -0.01757490634918213, -0.017037153244018555, -0.01649940013885498, -0.015961647033691406, -0.015423893928527832, -0.014886140823364258, -0.014348387718200684, -0.01381063461303711, -0.013272881507873535, -0.012735128402709961, -0.012197375297546387, -0.011659622192382812, -0.011121869087219238, -0.010584115982055664, -0.01004636287689209, -0.009508609771728516, -0.008970856666564941, -0.008433103561401367, -0.007895350456237793, -0.007357597351074219, -0.0068198442459106445, -0.00628209114074707, -0.005744338035583496, -0.005206584930419922, -0.004668831825256348, -0.0041310787200927734, -0.0035933256149291992, -0.003055572509765625, -0.0025178194046020508, -0.0019800662994384766, -0.0014423131942749023, -0.0009045600891113281, -0.0003668069839477539, 0.0001709461212158203, 0.0007086992263793945, 0.0012464523315429688, 0.001784205436706543, 0.002321958541870117, 0.0028597116470336914, 0.0033974647521972656, 0.00393521785736084, 0.004472970962524414, 0.005010724067687988, 0.0055484771728515625, 0.006086230278015137, 0.006623983383178711, 0.007161736488342285, 0.007699489593505859, 0.008237242698669434, 0.008774995803833008, 0.009312748908996582, 0.009850502014160156, 0.01038825511932373, 0.010926008224487305, 0.011463761329650879, 0.012001514434814453, 0.012539267539978027, 0.013077020645141602, 0.013614773750305176, 0.01415252685546875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 13.0, 8.0, 11.0, 31.0, 34.0, 44.0, 94.0, 117.0, 117.0, 137.0, 123.0, 84.0, 62.0, 51.0, 22.0, 17.0, 16.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3899691104888916, -2.2656664848327637, -2.1413636207580566, -2.0170609951019287, -1.8927582502365112, -1.7684555053710938, -1.6441528797149658, -1.5198501348495483, -1.3955473899841309, -1.2712446451187134, -1.146941900253296, -1.022639274597168, -0.8983365297317505, -0.774033784866333, -0.6497310996055603, -0.5254284143447876, -0.4011256694793701, -0.276822954416275, -0.15252023935317993, -0.02821752429008484, 0.09608519077301025, 0.22038793563842773, 0.34469062089920044, 0.46899330615997314, 0.5932960510253906, 0.7175987958908081, 0.8419014811515808, 0.9662041664123535, 1.090506911277771, 1.2148096561431885, 1.3391122817993164, 1.4634150266647339, 1.5877175331115723, 1.7120202779769897, 1.8363230228424072, 1.9606256484985352, 2.084928512573242, 2.20923113822937, 2.333533763885498, 2.457836627960205, 2.582139253616333, 2.706441879272461, 2.830744743347168, 2.955047369003296, 3.079349994659424, 3.203652858734131, 3.327955484390259, 3.4522581100463867, 3.5765609741210938, 3.7008635997772217, 3.8251664638519287, 3.9494690895080566, 4.073771953582764, 4.1980743408203125, 4.3223772048950195, 4.446680068969727, 4.570982933044434, 4.695285797119141, 4.8195881843566895, 4.9438910484313965, 5.0681939125061035, 5.192496299743652, 5.316799163818359, 5.441102027893066, 5.565404415130615]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 8.0, 9.0, 14.0, 23.0, 26.0, 41.0, 37.0, 47.0, 68.0, 71.0, 46.0, 70.0, 79.0, 77.0, 90.0, 54.0, 46.0, 55.0, 39.0, 28.0, 17.0, 15.0, 11.0, 5.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6897177696228027, -2.6059787273406982, -2.5222394466400146, -2.43850040435791, -2.3547613620758057, -2.271022319793701, -2.1872830390930176, -2.103543996810913, -2.0198049545288086, -1.9360657930374146, -1.85232675075531, -1.768587589263916, -1.6848485469818115, -1.6011093854904175, -1.5173702239990234, -1.433631181716919, -1.349892020225525, -1.2661528587341309, -1.1824138164520264, -1.0986746549606323, -1.0149356126785278, -0.9311964511871338, -0.8474573493003845, -0.7637182474136353, -0.679979145526886, -0.5962400436401367, -0.5125009417533875, -0.4287618100643158, -0.34502270817756653, -0.26128360629081726, -0.1775444746017456, -0.09380537271499634, -0.01006627082824707, 0.0736728385090828, 0.15741194784641266, 0.24115106463432312, 0.3248901665210724, 0.40862926840782166, 0.4923684000968933, 0.5761075019836426, 0.6598466038703918, 0.7435857057571411, 0.8273248076438904, 0.9110639095306396, 0.9948030710220337, 1.0785421133041382, 1.1622812747955322, 1.2460203170776367, 1.3297594785690308, 1.4134986400604248, 1.4972376823425293, 1.5809768438339233, 1.6647158861160278, 1.7484550476074219, 1.8321940898895264, 1.9159332513809204, 1.9996724128723145, 2.083411455154419, 2.1671507358551025, 2.250889778137207, 2.3346288204193115, 2.418367862701416, 2.5021071434020996, 2.585846185684204, 2.6695852279663086]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 4.0, 13.0, 17.0, 35.0, 52.0, 72.0, 106.0, 207.0, 387.0, 710.0, 1399.0, 2766.0, 5878.0, 14716.0, 43678.0, 199342.0, 592624.0, 131911.0, 33043.0, 11814.0, 4917.0, 2328.0, 1133.0, 581.0, 293.0, 212.0, 119.0, 70.0, 42.0, 23.0, 19.0, 10.0, 7.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.720703125, -1.662139892578125, -1.60357666015625, -1.545013427734375, -1.4864501953125, -1.427886962890625, -1.36932373046875, -1.310760498046875, -1.252197265625, -1.193634033203125, -1.13507080078125, -1.076507568359375, -1.0179443359375, -0.959381103515625, -0.90081787109375, -0.842254638671875, -0.78369140625, -0.725128173828125, -0.66656494140625, -0.608001708984375, -0.5494384765625, -0.490875244140625, -0.43231201171875, -0.373748779296875, -0.315185546875, -0.256622314453125, -0.19805908203125, -0.139495849609375, -0.0809326171875, -0.022369384765625, 0.03619384765625, 0.094757080078125, 0.1533203125, 0.211883544921875, 0.27044677734375, 0.329010009765625, 0.3875732421875, 0.446136474609375, 0.50469970703125, 0.563262939453125, 0.621826171875, 0.680389404296875, 0.73895263671875, 0.797515869140625, 0.8560791015625, 0.914642333984375, 0.97320556640625, 1.031768798828125, 1.09033203125, 1.148895263671875, 1.20745849609375, 1.266021728515625, 1.3245849609375, 1.383148193359375, 1.44171142578125, 1.500274658203125, 1.558837890625, 1.617401123046875, 1.67596435546875, 1.734527587890625, 1.7930908203125, 1.851654052734375, 1.91021728515625, 1.968780517578125, 2.02734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 8.0, 6.0, 10.0, 18.0, 25.0, 27.0, 22.0, 31.0, 41.0, 44.0, 65.0, 58.0, 60.0, 58.0, 64.0, 71.0, 67.0, 50.0, 55.0, 41.0, 39.0, 25.0, 24.0, 17.0, 13.0, 12.0, 13.0, 10.0, 3.0, 3.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.22265625, -5.07391357421875, -4.9251708984375, -4.77642822265625, -4.627685546875, -4.47894287109375, -4.3302001953125, -4.18145751953125, -4.03271484375, -3.88397216796875, -3.7352294921875, -3.58648681640625, -3.437744140625, -3.28900146484375, -3.1402587890625, -2.99151611328125, -2.8427734375, -2.69403076171875, -2.5452880859375, -2.39654541015625, -2.247802734375, -2.09906005859375, -1.9503173828125, -1.80157470703125, -1.65283203125, -1.50408935546875, -1.3553466796875, -1.20660400390625, -1.057861328125, -0.90911865234375, -0.7603759765625, -0.61163330078125, -0.462890625, -0.31414794921875, -0.1654052734375, -0.01666259765625, 0.132080078125, 0.28082275390625, 0.4295654296875, 0.57830810546875, 0.72705078125, 0.87579345703125, 1.0245361328125, 1.17327880859375, 1.322021484375, 1.47076416015625, 1.6195068359375, 1.76824951171875, 1.9169921875, 2.06573486328125, 2.2144775390625, 2.36322021484375, 2.511962890625, 2.66070556640625, 2.8094482421875, 2.95819091796875, 3.10693359375, 3.25567626953125, 3.4044189453125, 3.55316162109375, 3.701904296875, 3.85064697265625, 3.9993896484375, 4.14813232421875, 4.296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 8.0, 8.0, 13.0, 9.0, 19.0, 21.0, 24.0, 24.0, 28.0, 28.0, 36.0, 31.0, 42.0, 67.0, 109.0, 529.0, 201380.0, 844833.0, 850.0, 112.0, 56.0, 46.0, 34.0, 41.0, 45.0, 29.0, 31.0, 15.0, 13.0, 16.0, 13.0, 10.0, 2.0, 6.0, 2.0, 2.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.234375, -13.803955078125, -13.37353515625, -12.943115234375, -12.5126953125, -12.082275390625, -11.65185546875, -11.221435546875, -10.791015625, -10.360595703125, -9.93017578125, -9.499755859375, -9.0693359375, -8.638916015625, -8.20849609375, -7.778076171875, -7.34765625, -6.917236328125, -6.48681640625, -6.056396484375, -5.6259765625, -5.195556640625, -4.76513671875, -4.334716796875, -3.904296875, -3.473876953125, -3.04345703125, -2.613037109375, -2.1826171875, -1.752197265625, -1.32177734375, -0.891357421875, -0.4609375, -0.030517578125, 0.39990234375, 0.830322265625, 1.2607421875, 1.691162109375, 2.12158203125, 2.552001953125, 2.982421875, 3.412841796875, 3.84326171875, 4.273681640625, 4.7041015625, 5.134521484375, 5.56494140625, 5.995361328125, 6.42578125, 6.856201171875, 7.28662109375, 7.717041015625, 8.1474609375, 8.577880859375, 9.00830078125, 9.438720703125, 9.869140625, 10.299560546875, 10.72998046875, 11.160400390625, 11.5908203125, 12.021240234375, 12.45166015625, 12.882080078125, 13.3125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 9.0, 11.0, 11.0, 11.0, 18.0, 23.0, 17.0, 27.0, 28.0, 33.0, 34.0, 40.0, 42.0, 46.0, 43.0, 44.0, 54.0, 66.0, 46.0, 37.0, 37.0, 33.0, 34.0, 41.0, 42.0, 34.0, 19.0, 26.0, 11.0, 16.0, 20.0, 10.0, 11.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.820465087890625, -3.69757080078125, -3.574676513671875, -3.4517822265625, -3.328887939453125, -3.20599365234375, -3.083099365234375, -2.960205078125, -2.837310791015625, -2.71441650390625, -2.591522216796875, -2.4686279296875, -2.345733642578125, -2.22283935546875, -2.099945068359375, -1.97705078125, -1.854156494140625, -1.73126220703125, -1.608367919921875, -1.4854736328125, -1.362579345703125, -1.23968505859375, -1.116790771484375, -0.993896484375, -0.871002197265625, -0.74810791015625, -0.625213623046875, -0.5023193359375, -0.379425048828125, -0.25653076171875, -0.133636474609375, -0.0107421875, 0.112152099609375, 0.23504638671875, 0.357940673828125, 0.4808349609375, 0.603729248046875, 0.72662353515625, 0.849517822265625, 0.972412109375, 1.095306396484375, 1.21820068359375, 1.341094970703125, 1.4639892578125, 1.586883544921875, 1.70977783203125, 1.832672119140625, 1.95556640625, 2.078460693359375, 2.20135498046875, 2.324249267578125, 2.4471435546875, 2.570037841796875, 2.69293212890625, 2.815826416015625, 2.938720703125, 3.061614990234375, 3.18450927734375, 3.307403564453125, 3.4302978515625, 3.553192138671875, 3.67608642578125, 3.798980712890625, 3.921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 14.0, 11.0, 19.0, 22.0, 37.0, 67.0, 106.0, 180.0, 351.0, 704.0, 1696.0, 4394.0, 13786.0, 61373.0, 599624.0, 311800.0, 38533.0, 9921.0, 3238.0, 1349.0, 580.0, 311.0, 142.0, 96.0, 55.0, 40.0, 24.0, 21.0, 12.0, 10.0, 9.0, 5.0, 2.0, 9.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8466796875, -0.8216781616210938, -0.7966766357421875, -0.7716751098632812, -0.746673583984375, -0.7216720581054688, -0.6966705322265625, -0.6716690063476562, -0.64666748046875, -0.6216659545898438, -0.5966644287109375, -0.5716629028320312, -0.546661376953125, -0.5216598510742188, -0.4966583251953125, -0.47165679931640625, -0.4466552734375, -0.42165374755859375, -0.3966522216796875, -0.37165069580078125, -0.346649169921875, -0.32164764404296875, -0.2966461181640625, -0.27164459228515625, -0.24664306640625, -0.22164154052734375, -0.1966400146484375, -0.17163848876953125, -0.146636962890625, -0.12163543701171875, -0.0966339111328125, -0.07163238525390625, -0.046630859375, -0.02162933349609375, 0.0033721923828125, 0.02837371826171875, 0.053375244140625, 0.07837677001953125, 0.1033782958984375, 0.12837982177734375, 0.15338134765625, 0.17838287353515625, 0.2033843994140625, 0.22838592529296875, 0.253387451171875, 0.27838897705078125, 0.3033905029296875, 0.32839202880859375, 0.3533935546875, 0.37839508056640625, 0.4033966064453125, 0.42839813232421875, 0.453399658203125, 0.47840118408203125, 0.5034027099609375, 0.5284042358398438, 0.55340576171875, 0.5784072875976562, 0.6034088134765625, 0.6284103393554688, 0.653411865234375, 0.6784133911132812, 0.7034149169921875, 0.7284164428710938, 0.75341796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 0.0, 5.0, 0.0, 4.0, 10.0, 10.0, 10.0, 16.0, 22.0, 31.0, 40.0, 61.0, 100.0, 158.0, 159.0, 97.0, 80.0, 55.0, 32.0, 30.0, 19.0, 22.0, 12.0, 4.0, 5.0, 5.0, 1.0, 10.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011527538299560547, -0.00011168047785758972, -0.00010808557271957397, -0.00010449066758155823, -0.00010089576244354248, -9.730085730552673e-05, -9.370595216751099e-05, -9.011104702949524e-05, -8.651614189147949e-05, -8.292123675346375e-05, -7.9326331615448e-05, -7.573142647743225e-05, -7.21365213394165e-05, -6.854161620140076e-05, -6.494671106338501e-05, -6.135180592536926e-05, -5.7756900787353516e-05, -5.416199564933777e-05, -5.056709051132202e-05, -4.6972185373306274e-05, -4.337728023529053e-05, -3.978237509727478e-05, -3.618746995925903e-05, -3.2592564821243286e-05, -2.899765968322754e-05, -2.5402754545211792e-05, -2.1807849407196045e-05, -1.8212944269180298e-05, -1.461803913116455e-05, -1.1023133993148804e-05, -7.428228855133057e-06, -3.8333237171173096e-06, -2.384185791015625e-07, 3.3564865589141846e-06, 6.951391696929932e-06, 1.0546296834945679e-05, 1.4141201972961426e-05, 1.7736107110977173e-05, 2.133101224899292e-05, 2.4925917387008667e-05, 2.8520822525024414e-05, 3.211572766304016e-05, 3.571063280105591e-05, 3.9305537939071655e-05, 4.29004430770874e-05, 4.649534821510315e-05, 5.0090253353118896e-05, 5.3685158491134644e-05, 5.728006362915039e-05, 6.087496876716614e-05, 6.446987390518188e-05, 6.806477904319763e-05, 7.165968418121338e-05, 7.525458931922913e-05, 7.884949445724487e-05, 8.244439959526062e-05, 8.603930473327637e-05, 8.963420987129211e-05, 9.322911500930786e-05, 9.682402014732361e-05, 0.00010041892528533936, 0.0001040138304233551, 0.00010760873556137085, 0.0001112036406993866, 0.00011479854583740234]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 13.0, 11.0, 15.0, 21.0, 30.0, 42.0, 60.0, 123.0, 164.0, 274.0, 564.0, 1120.0, 2437.0, 6272.0, 19041.0, 71941.0, 551892.0, 319461.0, 51495.0, 14364.0, 5128.0, 1991.0, 937.0, 448.0, 280.0, 129.0, 91.0, 44.0, 39.0, 27.0, 22.0, 18.0, 12.0, 8.0, 4.0, 6.0, 2.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74560546875, -0.722930908203125, -0.70025634765625, -0.677581787109375, -0.6549072265625, -0.632232666015625, -0.60955810546875, -0.586883544921875, -0.564208984375, -0.541534423828125, -0.51885986328125, -0.496185302734375, -0.4735107421875, -0.450836181640625, -0.42816162109375, -0.405487060546875, -0.3828125, -0.360137939453125, -0.33746337890625, -0.314788818359375, -0.2921142578125, -0.269439697265625, -0.24676513671875, -0.224090576171875, -0.201416015625, -0.178741455078125, -0.15606689453125, -0.133392333984375, -0.1107177734375, -0.088043212890625, -0.06536865234375, -0.042694091796875, -0.02001953125, 0.002655029296875, 0.02532958984375, 0.048004150390625, 0.0706787109375, 0.093353271484375, 0.11602783203125, 0.138702392578125, 0.161376953125, 0.184051513671875, 0.20672607421875, 0.229400634765625, 0.2520751953125, 0.274749755859375, 0.29742431640625, 0.320098876953125, 0.3427734375, 0.365447998046875, 0.38812255859375, 0.410797119140625, 0.4334716796875, 0.456146240234375, 0.47882080078125, 0.501495361328125, 0.524169921875, 0.546844482421875, 0.56951904296875, 0.592193603515625, 0.6148681640625, 0.637542724609375, 0.66021728515625, 0.682891845703125, 0.70556640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 8.0, 10.0, 13.0, 10.0, 13.0, 18.0, 22.0, 21.0, 29.0, 39.0, 54.0, 77.0, 104.0, 115.0, 104.0, 70.0, 49.0, 37.0, 25.0, 31.0, 19.0, 24.0, 12.0, 14.0, 19.0, 8.0, 11.0, 2.0, 10.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.28466796875, -0.2768898010253906, -0.26911163330078125, -0.2613334655761719, -0.2535552978515625, -0.24577713012695312, -0.23799896240234375, -0.23022079467773438, -0.222442626953125, -0.21466445922851562, -0.20688629150390625, -0.19910812377929688, -0.1913299560546875, -0.18355178833007812, -0.17577362060546875, -0.16799545288085938, -0.16021728515625, -0.15243911743164062, -0.14466094970703125, -0.13688278198242188, -0.1291046142578125, -0.12132644653320312, -0.11354827880859375, -0.10577011108398438, -0.097991943359375, -0.09021377563476562, -0.08243560791015625, -0.07465744018554688, -0.0668792724609375, -0.059101104736328125, -0.05132293701171875, -0.043544769287109375, -0.0357666015625, -0.027988433837890625, -0.02021026611328125, -0.012432098388671875, -0.0046539306640625, 0.003124237060546875, 0.01090240478515625, 0.018680572509765625, 0.026458740234375, 0.034236907958984375, 0.04201507568359375, 0.049793243408203125, 0.0575714111328125, 0.06534957885742188, 0.07312774658203125, 0.08090591430664062, 0.08868408203125, 0.09646224975585938, 0.10424041748046875, 0.11201858520507812, 0.1197967529296875, 0.12757492065429688, 0.13535308837890625, 0.14313125610351562, 0.150909423828125, 0.15868759155273438, 0.16646575927734375, 0.17424392700195312, 0.1820220947265625, 0.18980026245117188, 0.19757843017578125, 0.20535659790039062, 0.213134765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 4.0, 16.0, 79.0, 237.0, 439.0, 177.0, 47.0, 12.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61046838760376, -3.756706714630127, -2.902945041656494, -2.0491833686828613, -1.1954216957092285, -0.3416600227355957, 0.5121016502380371, 1.36586332321167, 2.2196249961853027, 3.0733866691589355, 3.9271483421325684, 4.780910015106201, 5.634671688079834, 6.488433361053467, 7.3421950340271, 8.19595718383789, 9.049718856811523, 9.903480529785156, 10.757242202758789, 11.611003875732422, 12.464765548706055, 13.318527221679688, 14.17228889465332, 15.026050567626953, 15.879812240600586, 16.73357391357422, 17.58733558654785, 18.441097259521484, 19.294858932495117, 20.14862060546875, 21.002382278442383, 21.856143951416016, 22.709903717041016, 23.56366539001465, 24.41742706298828, 25.271188735961914, 26.124950408935547, 26.97871208190918, 27.832473754882812, 28.686235427856445, 29.539997100830078, 30.39375877380371, 31.247520446777344, 32.101280212402344, 32.95504379272461, 33.808807373046875, 34.662567138671875, 35.516326904296875, 36.37009048461914, 37.223854064941406, 38.077613830566406, 38.931373596191406, 39.78513717651367, 40.63890075683594, 41.49266052246094, 42.34642028808594, 43.2001838684082, 44.05394744873047, 44.90770721435547, 45.76146697998047, 46.615230560302734, 47.468994140625, 48.32275390625, 49.176513671875, 50.030277252197266]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 6.0, 8.0, 11.0, 12.0, 21.0, 20.0, 14.0, 30.0, 32.0, 32.0, 31.0, 55.0, 41.0, 52.0, 50.0, 53.0, 66.0, 54.0, 54.0, 48.0, 50.0, 40.0, 35.0, 31.0, 23.0, 30.0, 23.0, 16.0, 10.0, 9.0, 6.0, 10.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.082514762878418, -7.8463239669799805, -7.610133171081543, -7.3739423751831055, -7.13775110244751, -6.901560306549072, -6.665369510650635, -6.429178714752197, -6.192987442016602, -5.956796646118164, -5.720605850219727, -5.484415054321289, -5.248223781585693, -5.012032985687256, -4.775842189788818, -4.539651393890381, -4.303460597991943, -4.067269802093506, -3.8310787677764893, -3.5948879718780518, -3.358696937561035, -3.1225061416625977, -2.88631534576416, -2.6501245498657227, -2.413933515548706, -2.1777427196502686, -1.941551685333252, -1.7053608894348145, -1.4691699743270874, -1.2329790592193604, -0.9967882633209229, -0.7605973482131958, -0.5244064331054688, -0.2882155478000641, -0.052024662494659424, 0.18416619300842285, 0.4203571081161499, 0.656548023223877, 0.8927388191223145, 1.1289297342300415, 1.3651206493377686, 1.6013115644454956, 1.8375024795532227, 2.07369327545166, 2.3098840713500977, 2.5460751056671143, 2.7822659015655518, 3.0184569358825684, 3.254647731781006, 3.4908385276794434, 3.72702956199646, 3.9632203578948975, 4.199411392211914, 4.435602188110352, 4.671792984008789, 4.907983779907227, 5.144174575805664, 5.380365371704102, 5.616556167602539, 5.852746963500977, 6.088938236236572, 6.32512903213501, 6.561319828033447, 6.797510623931885, 7.0337018966674805]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 17.0, 14.0, 24.0, 29.0, 59.0, 65.0, 99.0, 190.0, 344.0, 673.0, 1271.0, 2783.0, 6755.0, 17586.0, 61850.0, 298004.0, 1566987.0, 1759518.0, 366687.0, 73480.0, 22596.0, 8537.0, 3531.0, 1486.0, 711.0, 403.0, 235.0, 128.0, 82.0, 34.0, 35.0, 24.0, 9.0, 10.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0], "bins": [-4.37890625, -4.26385498046875, -4.1488037109375, -4.03375244140625, -3.918701171875, -3.80364990234375, -3.6885986328125, -3.57354736328125, -3.45849609375, -3.34344482421875, -3.2283935546875, -3.11334228515625, -2.998291015625, -2.88323974609375, -2.7681884765625, -2.65313720703125, -2.5380859375, -2.42303466796875, -2.3079833984375, -2.19293212890625, -2.077880859375, -1.96282958984375, -1.8477783203125, -1.73272705078125, -1.61767578125, -1.50262451171875, -1.3875732421875, -1.27252197265625, -1.157470703125, -1.04241943359375, -0.9273681640625, -0.81231689453125, -0.697265625, -0.58221435546875, -0.4671630859375, -0.35211181640625, -0.237060546875, -0.12200927734375, -0.0069580078125, 0.10809326171875, 0.22314453125, 0.33819580078125, 0.4532470703125, 0.56829833984375, 0.683349609375, 0.79840087890625, 0.9134521484375, 1.02850341796875, 1.1435546875, 1.25860595703125, 1.3736572265625, 1.48870849609375, 1.603759765625, 1.71881103515625, 1.8338623046875, 1.94891357421875, 2.06396484375, 2.17901611328125, 2.2940673828125, 2.40911865234375, 2.524169921875, 2.63922119140625, 2.7542724609375, 2.86932373046875, 2.984375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 20.0, 22.0, 29.0, 40.0, 40.0, 51.0, 72.0, 60.0, 76.0, 75.0, 87.0, 85.0, 68.0, 50.0, 53.0, 42.0, 20.0, 27.0, 13.0, 12.0, 12.0, 7.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.2369384765625, -4.110595703125, -3.9842529296875, -3.85791015625, -3.7315673828125, -3.605224609375, -3.4788818359375, -3.3525390625, -3.2261962890625, -3.099853515625, -2.9735107421875, -2.84716796875, -2.7208251953125, -2.594482421875, -2.4681396484375, -2.341796875, -2.2154541015625, -2.089111328125, -1.9627685546875, -1.83642578125, -1.7100830078125, -1.583740234375, -1.4573974609375, -1.3310546875, -1.2047119140625, -1.078369140625, -0.9520263671875, -0.82568359375, -0.6993408203125, -0.572998046875, -0.4466552734375, -0.3203125, -0.1939697265625, -0.067626953125, 0.0587158203125, 0.18505859375, 0.3114013671875, 0.437744140625, 0.5640869140625, 0.6904296875, 0.8167724609375, 0.943115234375, 1.0694580078125, 1.19580078125, 1.3221435546875, 1.448486328125, 1.5748291015625, 1.701171875, 1.8275146484375, 1.953857421875, 2.0802001953125, 2.20654296875, 2.3328857421875, 2.459228515625, 2.5855712890625, 2.7119140625, 2.8382568359375, 2.964599609375, 3.0909423828125, 3.21728515625, 3.3436279296875, 3.469970703125, 3.5963134765625, 3.72265625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 10.0, 15.0, 37.0, 52.0, 113.0, 305.0, 1071.0, 5556.0, 257568.0, 3898602.0, 27735.0, 2237.0, 586.0, 185.0, 85.0, 59.0, 19.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.588134765625, -9.22314453125, -8.858154296875, -8.4931640625, -8.128173828125, -7.76318359375, -7.398193359375, -7.033203125, -6.668212890625, -6.30322265625, -5.938232421875, -5.5732421875, -5.208251953125, -4.84326171875, -4.478271484375, -4.11328125, -3.748291015625, -3.38330078125, -3.018310546875, -2.6533203125, -2.288330078125, -1.92333984375, -1.558349609375, -1.193359375, -0.828369140625, -0.46337890625, -0.098388671875, 0.2666015625, 0.631591796875, 0.99658203125, 1.361572265625, 1.7265625, 2.091552734375, 2.45654296875, 2.821533203125, 3.1865234375, 3.551513671875, 3.91650390625, 4.281494140625, 4.646484375, 5.011474609375, 5.37646484375, 5.741455078125, 6.1064453125, 6.471435546875, 6.83642578125, 7.201416015625, 7.56640625, 7.931396484375, 8.29638671875, 8.661376953125, 9.0263671875, 9.391357421875, 9.75634765625, 10.121337890625, 10.486328125, 10.851318359375, 11.21630859375, 11.581298828125, 11.9462890625, 12.311279296875, 12.67626953125, 13.041259765625, 13.40625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 8.0, 13.0, 21.0, 36.0, 51.0, 82.0, 117.0, 235.0, 388.0, 653.0, 847.0, 664.0, 377.0, 225.0, 117.0, 78.0, 52.0, 24.0, 22.0, 17.0, 14.0, 5.0, 10.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.60003662109375, -1.5457763671875, -1.49151611328125, -1.437255859375, -1.38299560546875, -1.3287353515625, -1.27447509765625, -1.22021484375, -1.16595458984375, -1.1116943359375, -1.05743408203125, -1.003173828125, -0.94891357421875, -0.8946533203125, -0.84039306640625, -0.7861328125, -0.73187255859375, -0.6776123046875, -0.62335205078125, -0.569091796875, -0.51483154296875, -0.4605712890625, -0.40631103515625, -0.35205078125, -0.29779052734375, -0.2435302734375, -0.18927001953125, -0.135009765625, -0.08074951171875, -0.0264892578125, 0.02777099609375, 0.08203125, 0.13629150390625, 0.1905517578125, 0.24481201171875, 0.299072265625, 0.35333251953125, 0.4075927734375, 0.46185302734375, 0.51611328125, 0.57037353515625, 0.6246337890625, 0.67889404296875, 0.733154296875, 0.78741455078125, 0.8416748046875, 0.89593505859375, 0.9501953125, 1.00445556640625, 1.0587158203125, 1.11297607421875, 1.167236328125, 1.22149658203125, 1.2757568359375, 1.33001708984375, 1.38427734375, 1.43853759765625, 1.4927978515625, 1.54705810546875, 1.601318359375, 1.65557861328125, 1.7098388671875, 1.76409912109375, 1.818359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 10.0, 17.0, 19.0, 18.0, 30.0, 27.0, 35.0, 58.0, 50.0, 67.0, 78.0, 86.0, 67.0, 84.0, 78.0, 58.0, 48.0, 35.0, 33.0, 24.0, 17.0, 13.0, 11.0, 6.0, 6.0, 7.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5593817234039307, -3.433736562728882, -3.308091402053833, -3.182446241378784, -3.0568008422851562, -2.9311556816101074, -2.8055105209350586, -2.6798653602600098, -2.554220199584961, -2.428575038909912, -2.3029298782348633, -2.1772847175598145, -2.0516395568847656, -1.9259942770004272, -1.8003489971160889, -1.67470383644104, -1.5490586757659912, -1.4234135150909424, -1.2977683544158936, -1.1721230745315552, -1.0464779138565063, -0.9208327531814575, -0.7951875329017639, -0.6695423126220703, -0.5438971519470215, -0.41825196146965027, -0.29260677099227905, -0.16696158051490784, -0.04131639003753662, 0.08432877063751221, 0.2099739909172058, 0.3356192111968994, 0.46126461029052734, 0.5869097709655762, 0.7125549912452698, 0.8382002115249634, 0.9638453722000122, 1.089490532875061, 1.2151358127593994, 1.3407809734344482, 1.466426134109497, 1.592071294784546, 1.7177164554595947, 1.843361735343933, 1.969006896018982, 2.0946521759033203, 2.220297336578369, 2.345942497253418, 2.471587657928467, 2.5972328186035156, 2.7228779792785645, 2.8485231399536133, 2.974168300628662, 3.099813461303711, 3.225458860397339, 3.3511040210723877, 3.4767491817474365, 3.6023943424224854, 3.728039503097534, 3.853684663772583, 3.979330062866211, 4.10497522354126, 4.230620384216309, 4.356265544891357, 4.481910705566406]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 10.0, 1.0, 10.0, 7.0, 18.0, 15.0, 14.0, 26.0, 27.0, 31.0, 24.0, 28.0, 39.0, 44.0, 32.0, 46.0, 43.0, 47.0, 43.0, 46.0, 49.0, 49.0, 47.0, 45.0, 38.0, 25.0, 30.0, 32.0, 18.0, 22.0, 13.0, 13.0, 13.0, 9.0, 7.0, 8.0, 8.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.0234243869781494, -2.9325292110443115, -2.8416337966918945, -2.7507386207580566, -2.6598434448242188, -2.568948268890381, -2.478053092956543, -2.387157678604126, -2.296262502670288, -2.20536732673645, -2.114471912384033, -2.0235767364501953, -1.9326815605163574, -1.8417863845825195, -1.750891089439392, -1.6599957942962646, -1.5691006183624268, -1.4782054424285889, -1.3873101472854614, -1.296414852142334, -1.205519676208496, -1.1146245002746582, -1.0237292051315308, -0.9328339695930481, -0.8419387340545654, -0.7510434985160828, -0.6601482629776001, -0.5692530274391174, -0.47835779190063477, -0.3874625563621521, -0.29656732082366943, -0.20567208528518677, -0.114776611328125, -0.023881375789642334, 0.06701385974884033, 0.157909095287323, 0.24880433082580566, 0.33969956636428833, 0.430594801902771, 0.5214900374412537, 0.6123852729797363, 0.703280508518219, 0.7941757440567017, 0.8850709795951843, 0.975966215133667, 1.0668613910675049, 1.1577566862106323, 1.2486519813537598, 1.3395471572875977, 1.4304423332214355, 1.521337628364563, 1.6122329235076904, 1.7031280994415283, 1.7940232753753662, 1.8849185705184937, 1.975813865661621, 2.066709041595459, 2.157604217529297, 2.2484993934631348, 2.3393948078155518, 2.4302899837493896, 2.5211851596832275, 2.6120805740356445, 2.7029757499694824, 2.7938709259033203]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 3.0, 8.0, 11.0, 18.0, 19.0, 29.0, 62.0, 72.0, 102.0, 151.0, 266.0, 530.0, 1054.0, 2541.0, 6841.0, 23233.0, 118416.0, 657532.0, 190203.0, 32752.0, 8758.0, 3035.0, 1370.0, 657.0, 335.0, 225.0, 113.0, 78.0, 53.0, 30.0, 13.0, 16.0, 6.0, 7.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7117385864257812, -0.6905670166015625, -0.6693954467773438, -0.648223876953125, -0.6270523071289062, -0.6058807373046875, -0.5847091674804688, -0.56353759765625, -0.5423660278320312, -0.5211944580078125, -0.5000228881835938, -0.478851318359375, -0.45767974853515625, -0.4365081787109375, -0.41533660888671875, -0.3941650390625, -0.37299346923828125, -0.3518218994140625, -0.33065032958984375, -0.309478759765625, -0.28830718994140625, -0.2671356201171875, -0.24596405029296875, -0.22479248046875, -0.20362091064453125, -0.1824493408203125, -0.16127777099609375, -0.140106201171875, -0.11893463134765625, -0.0977630615234375, -0.07659149169921875, -0.055419921875, -0.03424835205078125, -0.0130767822265625, 0.00809478759765625, 0.029266357421875, 0.05043792724609375, 0.0716094970703125, 0.09278106689453125, 0.11395263671875, 0.13512420654296875, 0.1562957763671875, 0.17746734619140625, 0.198638916015625, 0.21981048583984375, 0.2409820556640625, 0.26215362548828125, 0.2833251953125, 0.30449676513671875, 0.3256683349609375, 0.34683990478515625, 0.368011474609375, 0.38918304443359375, 0.4103546142578125, 0.43152618408203125, 0.45269775390625, 0.47386932373046875, 0.4950408935546875, 0.5162124633789062, 0.537384033203125, 0.5585556030273438, 0.5797271728515625, 0.6008987426757812, 0.6220703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 12.0, 6.0, 16.0, 15.0, 31.0, 35.0, 39.0, 50.0, 54.0, 56.0, 73.0, 64.0, 69.0, 70.0, 71.0, 67.0, 55.0, 50.0, 25.0, 33.0, 21.0, 16.0, 15.0, 16.0, 8.0, 8.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4921875, -2.410003662109375, -2.32781982421875, -2.245635986328125, -2.1634521484375, -2.081268310546875, -1.99908447265625, -1.916900634765625, -1.834716796875, -1.752532958984375, -1.67034912109375, -1.588165283203125, -1.5059814453125, -1.423797607421875, -1.34161376953125, -1.259429931640625, -1.17724609375, -1.095062255859375, -1.01287841796875, -0.930694580078125, -0.8485107421875, -0.766326904296875, -0.68414306640625, -0.601959228515625, -0.519775390625, -0.437591552734375, -0.35540771484375, -0.273223876953125, -0.1910400390625, -0.108856201171875, -0.02667236328125, 0.055511474609375, 0.1376953125, 0.219879150390625, 0.30206298828125, 0.384246826171875, 0.4664306640625, 0.548614501953125, 0.63079833984375, 0.712982177734375, 0.795166015625, 0.877349853515625, 0.95953369140625, 1.041717529296875, 1.1239013671875, 1.206085205078125, 1.28826904296875, 1.370452880859375, 1.45263671875, 1.534820556640625, 1.61700439453125, 1.699188232421875, 1.7813720703125, 1.863555908203125, 1.94573974609375, 2.027923583984375, 2.110107421875, 2.192291259765625, 2.27447509765625, 2.356658935546875, 2.4388427734375, 2.521026611328125, 2.60321044921875, 2.685394287109375, 2.767578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 8.0, 6.0, 10.0, 16.0, 17.0, 29.0, 46.0, 61.0, 107.0, 168.0, 276.0, 405.0, 715.0, 1192.0, 1787.0, 3167.0, 5514.0, 10051.0, 19186.0, 38034.0, 82440.0, 195843.0, 352129.0, 183198.0, 77113.0, 36634.0, 18004.0, 9568.0, 5269.0, 3030.0, 1762.0, 1022.0, 647.0, 391.0, 259.0, 158.0, 108.0, 62.0, 37.0, 23.0, 18.0, 17.0, 10.0, 9.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.210205078125, -0.20330429077148438, -0.19640350341796875, -0.18950271606445312, -0.1826019287109375, -0.17570114135742188, -0.16880035400390625, -0.16189956665039062, -0.154998779296875, -0.14809799194335938, -0.14119720458984375, -0.13429641723632812, -0.1273956298828125, -0.12049484252929688, -0.11359405517578125, -0.10669326782226562, -0.09979248046875, -0.09289169311523438, -0.08599090576171875, -0.07909011840820312, -0.0721893310546875, -0.06528854370117188, -0.05838775634765625, -0.051486968994140625, -0.044586181640625, -0.037685394287109375, -0.03078460693359375, -0.023883819580078125, -0.0169830322265625, -0.010082244873046875, -0.00318145751953125, 0.003719329833984375, 0.0106201171875, 0.017520904541015625, 0.02442169189453125, 0.031322479248046875, 0.0382232666015625, 0.045124053955078125, 0.05202484130859375, 0.058925628662109375, 0.065826416015625, 0.07272720336914062, 0.07962799072265625, 0.08652877807617188, 0.0934295654296875, 0.10033035278320312, 0.10723114013671875, 0.11413192749023438, 0.12103271484375, 0.12793350219726562, 0.13483428955078125, 0.14173507690429688, 0.1486358642578125, 0.15553665161132812, 0.16243743896484375, 0.16933822631835938, 0.176239013671875, 0.18313980102539062, 0.19004058837890625, 0.19694137573242188, 0.2038421630859375, 0.21074295043945312, 0.21764373779296875, 0.22454452514648438, 0.2314453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 6.0, 6.0, 6.0, 13.0, 17.0, 9.0, 15.0, 18.0, 33.0, 24.0, 32.0, 37.0, 30.0, 32.0, 34.0, 40.0, 36.0, 43.0, 43.0, 63.0, 54.0, 46.0, 30.0, 36.0, 25.0, 30.0, 27.0, 35.0, 21.0, 25.0, 16.0, 18.0, 19.0, 12.0, 12.0, 12.0, 9.0, 3.0, 4.0, 3.0, 5.0, 5.0, 4.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.972900390625, -2.86767578125, -2.762451171875, -2.6572265625, -2.552001953125, -2.44677734375, -2.341552734375, -2.236328125, -2.131103515625, -2.02587890625, -1.920654296875, -1.8154296875, -1.710205078125, -1.60498046875, -1.499755859375, -1.39453125, -1.289306640625, -1.18408203125, -1.078857421875, -0.9736328125, -0.868408203125, -0.76318359375, -0.657958984375, -0.552734375, -0.447509765625, -0.34228515625, -0.237060546875, -0.1318359375, -0.026611328125, 0.07861328125, 0.183837890625, 0.2890625, 0.394287109375, 0.49951171875, 0.604736328125, 0.7099609375, 0.815185546875, 0.92041015625, 1.025634765625, 1.130859375, 1.236083984375, 1.34130859375, 1.446533203125, 1.5517578125, 1.656982421875, 1.76220703125, 1.867431640625, 1.97265625, 2.077880859375, 2.18310546875, 2.288330078125, 2.3935546875, 2.498779296875, 2.60400390625, 2.709228515625, 2.814453125, 2.919677734375, 3.02490234375, 3.130126953125, 3.2353515625, 3.340576171875, 3.44580078125, 3.551025390625, 3.65625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 10.0, 9.0, 13.0, 13.0, 21.0, 38.0, 40.0, 83.0, 129.0, 195.0, 292.0, 560.0, 956.0, 1843.0, 4468.0, 12969.0, 48032.0, 326534.0, 551631.0, 72354.0, 17588.0, 5866.0, 2362.0, 1076.0, 584.0, 335.0, 193.0, 122.0, 77.0, 49.0, 33.0, 24.0, 14.0, 8.0, 14.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.06353759765625, -0.06172895431518555, -0.059920310974121094, -0.05811166763305664, -0.05630302429199219, -0.054494380950927734, -0.05268573760986328, -0.05087709426879883, -0.049068450927734375, -0.04725980758666992, -0.04545116424560547, -0.043642520904541016, -0.04183387756347656, -0.04002523422241211, -0.038216590881347656, -0.0364079475402832, -0.03459930419921875, -0.0327906608581543, -0.030982017517089844, -0.02917337417602539, -0.027364730834960938, -0.025556087493896484, -0.02374744415283203, -0.021938800811767578, -0.020130157470703125, -0.018321514129638672, -0.01651287078857422, -0.014704227447509766, -0.012895584106445312, -0.01108694076538086, -0.009278297424316406, -0.007469654083251953, -0.0056610107421875, -0.003852367401123047, -0.0020437240600585938, -0.00023508071899414062, 0.0015735626220703125, 0.0033822059631347656, 0.005190849304199219, 0.006999492645263672, 0.008808135986328125, 0.010616779327392578, 0.012425422668457031, 0.014234066009521484, 0.016042709350585938, 0.01785135269165039, 0.019659996032714844, 0.021468639373779297, 0.02327728271484375, 0.025085926055908203, 0.026894569396972656, 0.02870321273803711, 0.030511856079101562, 0.032320499420166016, 0.03412914276123047, 0.03593778610229492, 0.037746429443359375, 0.03955507278442383, 0.04136371612548828, 0.043172359466552734, 0.04498100280761719, 0.04678964614868164, 0.048598289489746094, 0.05040693283081055, 0.052215576171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 2.0, 1.0, 8.0, 8.0, 9.0, 11.0, 13.0, 18.0, 26.0, 27.0, 35.0, 37.0, 46.0, 42.0, 62.0, 79.0, 76.0, 48.0, 63.0, 62.0, 60.0, 53.0, 38.0, 32.0, 28.0, 25.0, 17.0, 10.0, 7.0, 8.0, 8.0, 9.0, 7.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.24249267578125e-05, -3.152620047330856e-05, -3.0627474188804626e-05, -2.972874790430069e-05, -2.8830021619796753e-05, -2.7931295335292816e-05, -2.703256905078888e-05, -2.6133842766284943e-05, -2.5235116481781006e-05, -2.433639019727707e-05, -2.3437663912773132e-05, -2.2538937628269196e-05, -2.164021134376526e-05, -2.0741485059261322e-05, -1.9842758774757385e-05, -1.894403249025345e-05, -1.8045306205749512e-05, -1.7146579921245575e-05, -1.6247853636741638e-05, -1.53491273522377e-05, -1.4450401067733765e-05, -1.3551674783229828e-05, -1.2652948498725891e-05, -1.1754222214221954e-05, -1.0855495929718018e-05, -9.95676964521408e-06, -9.058043360710144e-06, -8.159317076206207e-06, -7.2605907917022705e-06, -6.361864507198334e-06, -5.463138222694397e-06, -4.56441193819046e-06, -3.6656856536865234e-06, -2.7669593691825867e-06, -1.86823308467865e-06, -9.695068001747131e-07, -7.078051567077637e-08, 8.279457688331604e-07, 1.7266720533370972e-06, 2.625398337841034e-06, 3.5241246223449707e-06, 4.4228509068489075e-06, 5.321577191352844e-06, 6.220303475856781e-06, 7.119029760360718e-06, 8.017756044864655e-06, 8.916482329368591e-06, 9.815208613872528e-06, 1.0713934898376465e-05, 1.1612661182880402e-05, 1.2511387467384338e-05, 1.3410113751888275e-05, 1.4308840036392212e-05, 1.5207566320896149e-05, 1.6106292605400085e-05, 1.7005018889904022e-05, 1.790374517440796e-05, 1.8802471458911896e-05, 1.9701197743415833e-05, 2.059992402791977e-05, 2.1498650312423706e-05, 2.2397376596927643e-05, 2.329610288143158e-05, 2.4194829165935516e-05, 2.5093555450439453e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 19.0, 23.0, 38.0, 52.0, 107.0, 298.0, 927.0, 4120.0, 33014.0, 749889.0, 240943.0, 15647.0, 2463.0, 546.0, 207.0, 91.0, 49.0, 24.0, 17.0, 11.0, 14.0, 10.0, 9.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.150146484375, -0.1460704803466797, -0.14199447631835938, -0.13791847229003906, -0.13384246826171875, -0.12976646423339844, -0.12569046020507812, -0.12161445617675781, -0.1175384521484375, -0.11346244812011719, -0.10938644409179688, -0.10531044006347656, -0.10123443603515625, -0.09715843200683594, -0.09308242797851562, -0.08900642395019531, -0.084930419921875, -0.08085441589355469, -0.07677841186523438, -0.07270240783691406, -0.06862640380859375, -0.06455039978027344, -0.060474395751953125, -0.05639839172363281, -0.0523223876953125, -0.04824638366699219, -0.044170379638671875, -0.04009437561035156, -0.03601837158203125, -0.03194236755371094, -0.027866363525390625, -0.023790359497070312, -0.01971435546875, -0.015638351440429688, -0.011562347412109375, -0.0074863433837890625, -0.00341033935546875, 0.0006656646728515625, 0.004741668701171875, 0.008817672729492188, 0.0128936767578125, 0.016969680786132812, 0.021045684814453125, 0.025121688842773438, 0.02919769287109375, 0.03327369689941406, 0.037349700927734375, 0.04142570495605469, 0.045501708984375, 0.04957771301269531, 0.053653717041015625, 0.05772972106933594, 0.06180572509765625, 0.06588172912597656, 0.06995773315429688, 0.07403373718261719, 0.0781097412109375, 0.08218574523925781, 0.08626174926757812, 0.09033775329589844, 0.09441375732421875, 0.09848976135253906, 0.10256576538085938, 0.10664176940917969, 0.1107177734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 8.0, 6.0, 6.0, 9.0, 14.0, 13.0, 10.0, 21.0, 21.0, 22.0, 23.0, 52.0, 75.0, 110.0, 105.0, 134.0, 85.0, 63.0, 38.0, 27.0, 25.0, 24.0, 13.0, 21.0, 19.0, 9.0, 13.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01727294921875, -0.01674628257751465, -0.016219615936279297, -0.015692949295043945, -0.015166282653808594, -0.014639616012573242, -0.01411294937133789, -0.013586282730102539, -0.013059616088867188, -0.012532949447631836, -0.012006282806396484, -0.011479616165161133, -0.010952949523925781, -0.01042628288269043, -0.009899616241455078, -0.009372949600219727, -0.008846282958984375, -0.008319616317749023, -0.007792949676513672, -0.00726628303527832, -0.006739616394042969, -0.006212949752807617, -0.005686283111572266, -0.005159616470336914, -0.0046329498291015625, -0.004106283187866211, -0.0035796165466308594, -0.003052949905395508, -0.0025262832641601562, -0.0019996166229248047, -0.0014729499816894531, -0.0009462833404541016, -0.00041961669921875, 0.00010704994201660156, 0.0006337165832519531, 0.0011603832244873047, 0.0016870498657226562, 0.002213716506958008, 0.0027403831481933594, 0.003267049789428711, 0.0037937164306640625, 0.004320383071899414, 0.004847049713134766, 0.005373716354370117, 0.005900382995605469, 0.00642704963684082, 0.006953716278076172, 0.0074803829193115234, 0.008007049560546875, 0.008533716201782227, 0.009060382843017578, 0.00958704948425293, 0.010113716125488281, 0.010640382766723633, 0.011167049407958984, 0.011693716049194336, 0.012220382690429688, 0.012747049331665039, 0.01327371597290039, 0.013800382614135742, 0.014327049255371094, 0.014853715896606445, 0.015380382537841797, 0.01590704917907715, 0.0164337158203125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 17.0, 19.0, 29.0, 42.0, 63.0, 83.0, 120.0, 119.0, 114.0, 111.0, 91.0, 60.0, 38.0, 29.0, 16.0, 10.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.538412570953369, -3.428050994873047, -3.3176894187927246, -3.2073278427124023, -3.09696626663208, -2.986604690551758, -2.8762431144714355, -2.7658815383911133, -2.655519962310791, -2.5451583862304688, -2.4347968101501465, -2.324435234069824, -2.214073657989502, -2.1037120819091797, -1.9933505058288574, -1.8829889297485352, -1.772627353668213, -1.6622657775878906, -1.5519042015075684, -1.441542625427246, -1.3311810493469238, -1.2208194732666016, -1.1104578971862793, -1.000096321105957, -0.8897347450256348, -0.7793731689453125, -0.6690115928649902, -0.558650016784668, -0.4482884407043457, -0.33792686462402344, -0.22756528854370117, -0.1172037124633789, -0.006842374801635742, 0.10351920127868652, 0.2138807773590088, 0.32424235343933105, 0.4346039295196533, 0.5449655055999756, 0.6553270816802979, 0.7656886577606201, 0.8760502338409424, 0.9864118099212646, 1.096773386001587, 1.2071349620819092, 1.3174965381622314, 1.4278581142425537, 1.538219690322876, 1.6485812664031982, 1.7589428424835205, 1.8693044185638428, 1.979665994644165, 2.0900275707244873, 2.2003891468048096, 2.310750722885132, 2.421112298965454, 2.5314738750457764, 2.6418354511260986, 2.752197027206421, 2.862558603286743, 2.9729201793670654, 3.0832817554473877, 3.19364333152771, 3.3040049076080322, 3.4143664836883545, 3.5247280597686768]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 4.0, 2.0, 5.0, 9.0, 9.0, 23.0, 16.0, 21.0, 32.0, 22.0, 35.0, 35.0, 41.0, 60.0, 42.0, 49.0, 52.0, 56.0, 52.0, 60.0, 44.0, 63.0, 40.0, 36.0, 35.0, 25.0, 28.0, 18.0, 15.0, 14.0, 7.0, 12.0, 10.0, 3.0, 5.0, 7.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9951624870300293, -1.933447003364563, -1.8717315196990967, -1.8100160360336304, -1.748300552368164, -1.6865849494934082, -1.624869465827942, -1.5631539821624756, -1.5014384984970093, -1.439723014831543, -1.3780075311660767, -1.3162920475006104, -1.2545764446258545, -1.1928610801696777, -1.1311454772949219, -1.0694299936294556, -1.0077145099639893, -0.945999026298523, -0.8842835426330566, -0.8225679993629456, -0.7608525156974792, -0.6991370320320129, -0.6374214887619019, -0.5757060050964355, -0.5139905214309692, -0.45227503776550293, -0.39055952429771423, -0.32884401082992554, -0.26712852716445923, -0.20541304349899292, -0.14369753003120422, -0.08198201656341553, -0.020266413688659668, 0.041449084877967834, 0.10316458344459534, 0.16488008201122284, 0.22659558057785034, 0.28831106424331665, 0.35002657771110535, 0.41174209117889404, 0.47345757484436035, 0.5351730585098267, 0.596888542175293, 0.658604085445404, 0.7203195691108704, 0.7820350527763367, 0.8437505960464478, 0.9054660797119141, 0.9671815633773804, 1.0288970470428467, 1.090612530708313, 1.1523280143737793, 1.2140436172485352, 1.275758981704712, 1.3374745845794678, 1.399190068244934, 1.4609055519104004, 1.5226210355758667, 1.584336519241333, 1.6460520029067993, 1.7077674865722656, 1.7694830894470215, 1.8311985731124878, 1.892914056777954, 1.9546295404434204]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 5.0, 7.0, 7.0, 7.0, 16.0, 19.0, 25.0, 20.0, 42.0, 57.0, 122.0, 300.0, 1115.0, 4333.0, 25008.0, 217968.0, 668072.0, 112472.0, 14752.0, 2921.0, 773.0, 231.0, 76.0, 70.0, 33.0, 23.0, 11.0, 11.0, 9.0, 6.0, 9.0, 3.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.3203125, -5.1558837890625, -4.991455078125, -4.8270263671875, -4.66259765625, -4.4981689453125, -4.333740234375, -4.1693115234375, -4.0048828125, -3.8404541015625, -3.676025390625, -3.5115966796875, -3.34716796875, -3.1827392578125, -3.018310546875, -2.8538818359375, -2.689453125, -2.5250244140625, -2.360595703125, -2.1961669921875, -2.03173828125, -1.8673095703125, -1.702880859375, -1.5384521484375, -1.3740234375, -1.2095947265625, -1.045166015625, -0.8807373046875, -0.71630859375, -0.5518798828125, -0.387451171875, -0.2230224609375, -0.05859375, 0.1058349609375, 0.270263671875, 0.4346923828125, 0.59912109375, 0.7635498046875, 0.927978515625, 1.0924072265625, 1.2568359375, 1.4212646484375, 1.585693359375, 1.7501220703125, 1.91455078125, 2.0789794921875, 2.243408203125, 2.4078369140625, 2.572265625, 2.7366943359375, 2.901123046875, 3.0655517578125, 3.22998046875, 3.3944091796875, 3.558837890625, 3.7232666015625, 3.8876953125, 4.0521240234375, 4.216552734375, 4.3809814453125, 4.54541015625, 4.7098388671875, 4.874267578125, 5.0386962890625, 5.203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 13.0, 12.0, 21.0, 27.0, 48.0, 51.0, 68.0, 97.0, 100.0, 94.0, 103.0, 93.0, 88.0, 66.0, 38.0, 28.0, 14.0, 15.0, 11.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.85333251953125, -3.6324462890625, -3.41156005859375, -3.190673828125, -2.96978759765625, -2.7489013671875, -2.52801513671875, -2.30712890625, -2.08624267578125, -1.8653564453125, -1.64447021484375, -1.423583984375, -1.20269775390625, -0.9818115234375, -0.76092529296875, -0.5400390625, -0.31915283203125, -0.0982666015625, 0.12261962890625, 0.343505859375, 0.56439208984375, 0.7852783203125, 1.00616455078125, 1.22705078125, 1.44793701171875, 1.6688232421875, 1.88970947265625, 2.110595703125, 2.33148193359375, 2.5523681640625, 2.77325439453125, 2.994140625, 3.21502685546875, 3.4359130859375, 3.65679931640625, 3.877685546875, 4.09857177734375, 4.3194580078125, 4.54034423828125, 4.76123046875, 4.98211669921875, 5.2030029296875, 5.42388916015625, 5.644775390625, 5.86566162109375, 6.0865478515625, 6.30743408203125, 6.5283203125, 6.74920654296875, 6.9700927734375, 7.19097900390625, 7.411865234375, 7.63275146484375, 7.8536376953125, 8.07452392578125, 8.29541015625, 8.51629638671875, 8.7371826171875, 8.95806884765625, 9.178955078125, 9.39984130859375, 9.6207275390625, 9.84161376953125, 10.0625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 12.0, 19.0, 30.0, 28.0, 46.0, 44.0, 55.0, 95.0, 136.0, 180.0, 347.0, 687.0, 1559.0, 5324.0, 34061.0, 448777.0, 509013.0, 39033.0, 5639.0, 1652.0, 701.0, 399.0, 185.0, 142.0, 93.0, 77.0, 50.0, 39.0, 24.0, 20.0, 17.0, 16.0, 9.0, 9.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-5.76171875, -5.5924072265625, -5.423095703125, -5.2537841796875, -5.08447265625, -4.9151611328125, -4.745849609375, -4.5765380859375, -4.4072265625, -4.2379150390625, -4.068603515625, -3.8992919921875, -3.72998046875, -3.5606689453125, -3.391357421875, -3.2220458984375, -3.052734375, -2.8834228515625, -2.714111328125, -2.5447998046875, -2.37548828125, -2.2061767578125, -2.036865234375, -1.8675537109375, -1.6982421875, -1.5289306640625, -1.359619140625, -1.1903076171875, -1.02099609375, -0.8516845703125, -0.682373046875, -0.5130615234375, -0.34375, -0.1744384765625, -0.005126953125, 0.1641845703125, 0.33349609375, 0.5028076171875, 0.672119140625, 0.8414306640625, 1.0107421875, 1.1800537109375, 1.349365234375, 1.5186767578125, 1.68798828125, 1.8572998046875, 2.026611328125, 2.1959228515625, 2.365234375, 2.5345458984375, 2.703857421875, 2.8731689453125, 3.04248046875, 3.2117919921875, 3.381103515625, 3.5504150390625, 3.7197265625, 3.8890380859375, 4.058349609375, 4.2276611328125, 4.39697265625, 4.5662841796875, 4.735595703125, 4.9049072265625, 5.07421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 11.0, 7.0, 9.0, 10.0, 14.0, 18.0, 12.0, 19.0, 28.0, 31.0, 34.0, 29.0, 36.0, 43.0, 32.0, 36.0, 38.0, 41.0, 49.0, 47.0, 37.0, 46.0, 45.0, 43.0, 35.0, 39.0, 36.0, 29.0, 24.0, 21.0, 15.0, 17.0, 10.0, 9.0, 9.0, 7.0, 5.0, 3.0, 5.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.296875, -3.19189453125, -3.0869140625, -2.98193359375, -2.876953125, -2.77197265625, -2.6669921875, -2.56201171875, -2.45703125, -2.35205078125, -2.2470703125, -2.14208984375, -2.037109375, -1.93212890625, -1.8271484375, -1.72216796875, -1.6171875, -1.51220703125, -1.4072265625, -1.30224609375, -1.197265625, -1.09228515625, -0.9873046875, -0.88232421875, -0.77734375, -0.67236328125, -0.5673828125, -0.46240234375, -0.357421875, -0.25244140625, -0.1474609375, -0.04248046875, 0.0625, 0.16748046875, 0.2724609375, 0.37744140625, 0.482421875, 0.58740234375, 0.6923828125, 0.79736328125, 0.90234375, 1.00732421875, 1.1123046875, 1.21728515625, 1.322265625, 1.42724609375, 1.5322265625, 1.63720703125, 1.7421875, 1.84716796875, 1.9521484375, 2.05712890625, 2.162109375, 2.26708984375, 2.3720703125, 2.47705078125, 2.58203125, 2.68701171875, 2.7919921875, 2.89697265625, 3.001953125, 3.10693359375, 3.2119140625, 3.31689453125, 3.421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 8.0, 3.0, 9.0, 18.0, 33.0, 50.0, 75.0, 162.0, 422.0, 1246.0, 4173.0, 19111.0, 121082.0, 660341.0, 204422.0, 28910.0, 5928.0, 1610.0, 515.0, 182.0, 92.0, 64.0, 28.0, 18.0, 19.0, 14.0, 3.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.197845458984375, -1.15447998046875, -1.111114501953125, -1.0677490234375, -1.024383544921875, -0.98101806640625, -0.937652587890625, -0.894287109375, -0.850921630859375, -0.80755615234375, -0.764190673828125, -0.7208251953125, -0.677459716796875, -0.63409423828125, -0.590728759765625, -0.54736328125, -0.503997802734375, -0.46063232421875, -0.417266845703125, -0.3739013671875, -0.330535888671875, -0.28717041015625, -0.243804931640625, -0.200439453125, -0.157073974609375, -0.11370849609375, -0.070343017578125, -0.0269775390625, 0.016387939453125, 0.05975341796875, 0.103118896484375, 0.146484375, 0.189849853515625, 0.23321533203125, 0.276580810546875, 0.3199462890625, 0.363311767578125, 0.40667724609375, 0.450042724609375, 0.493408203125, 0.536773681640625, 0.58013916015625, 0.623504638671875, 0.6668701171875, 0.710235595703125, 0.75360107421875, 0.796966552734375, 0.84033203125, 0.883697509765625, 0.92706298828125, 0.970428466796875, 1.0137939453125, 1.057159423828125, 1.10052490234375, 1.143890380859375, 1.187255859375, 1.230621337890625, 1.27398681640625, 1.317352294921875, 1.3607177734375, 1.404083251953125, 1.44744873046875, 1.490814208984375, 1.5341796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 7.0, 14.0, 12.0, 16.0, 19.0, 31.0, 31.0, 47.0, 52.0, 75.0, 96.0, 90.0, 86.0, 66.0, 64.0, 48.0, 48.0, 49.0, 36.0, 28.0, 14.0, 12.0, 12.0, 10.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001437664031982422, -0.0001395680010318756, -0.00013536959886550903, -0.00013117119669914246, -0.00012697279453277588, -0.0001227743923664093, -0.00011857599020004272, -0.00011437758803367615, -0.00011017918586730957, -0.00010598078370094299, -0.00010178238153457642, -9.758397936820984e-05, -9.338557720184326e-05, -8.918717503547668e-05, -8.498877286911011e-05, -8.079037070274353e-05, -7.659196853637695e-05, -7.239356637001038e-05, -6.81951642036438e-05, -6.399676203727722e-05, -5.9798359870910645e-05, -5.559995770454407e-05, -5.140155553817749e-05, -4.720315337181091e-05, -4.3004751205444336e-05, -3.880634903907776e-05, -3.460794687271118e-05, -3.0409544706344604e-05, -2.6211142539978027e-05, -2.201274037361145e-05, -1.7814338207244873e-05, -1.3615936040878296e-05, -9.417533874511719e-06, -5.219131708145142e-06, -1.0207295417785645e-06, 3.1776726245880127e-06, 7.37607479095459e-06, 1.1574476957321167e-05, 1.5772879123687744e-05, 1.997128129005432e-05, 2.41696834564209e-05, 2.8368085622787476e-05, 3.256648778915405e-05, 3.676488995552063e-05, 4.096329212188721e-05, 4.5161694288253784e-05, 4.936009645462036e-05, 5.355849862098694e-05, 5.7756900787353516e-05, 6.195530295372009e-05, 6.615370512008667e-05, 7.035210728645325e-05, 7.455050945281982e-05, 7.87489116191864e-05, 8.294731378555298e-05, 8.714571595191956e-05, 9.134411811828613e-05, 9.554252028465271e-05, 9.974092245101929e-05, 0.00010393932461738586, 0.00010813772678375244, 0.00011233612895011902, 0.0001165345311164856, 0.00012073293328285217, 0.00012493133544921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 5.0, 6.0, 5.0, 4.0, 19.0, 12.0, 21.0, 21.0, 39.0, 57.0, 127.0, 202.0, 471.0, 1357.0, 5176.0, 28535.0, 233104.0, 662135.0, 98646.0, 13996.0, 2951.0, 903.0, 324.0, 179.0, 82.0, 51.0, 40.0, 26.0, 18.0, 14.0, 8.0, 7.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.180877685546875, -1.13421630859375, -1.087554931640625, -1.0408935546875, -0.994232177734375, -0.94757080078125, -0.900909423828125, -0.854248046875, -0.807586669921875, -0.76092529296875, -0.714263916015625, -0.6676025390625, -0.620941162109375, -0.57427978515625, -0.527618408203125, -0.48095703125, -0.434295654296875, -0.38763427734375, -0.340972900390625, -0.2943115234375, -0.247650146484375, -0.20098876953125, -0.154327392578125, -0.107666015625, -0.061004638671875, -0.01434326171875, 0.032318115234375, 0.0789794921875, 0.125640869140625, 0.17230224609375, 0.218963623046875, 0.265625, 0.312286376953125, 0.35894775390625, 0.405609130859375, 0.4522705078125, 0.498931884765625, 0.54559326171875, 0.592254638671875, 0.638916015625, 0.685577392578125, 0.73223876953125, 0.778900146484375, 0.8255615234375, 0.872222900390625, 0.91888427734375, 0.965545654296875, 1.01220703125, 1.058868408203125, 1.10552978515625, 1.152191162109375, 1.1988525390625, 1.245513916015625, 1.29217529296875, 1.338836669921875, 1.385498046875, 1.432159423828125, 1.47882080078125, 1.525482177734375, 1.5721435546875, 1.618804931640625, 1.66546630859375, 1.712127685546875, 1.7587890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 6.0, 8.0, 9.0, 14.0, 22.0, 22.0, 15.0, 20.0, 32.0, 31.0, 69.0, 65.0, 80.0, 71.0, 78.0, 72.0, 86.0, 56.0, 53.0, 30.0, 27.0, 20.0, 22.0, 16.0, 21.0, 13.0, 7.0, 5.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.3656883239746094, -0.35247039794921875, -0.3392524719238281, -0.3260345458984375, -0.3128166198730469, -0.29959869384765625, -0.2863807678222656, -0.273162841796875, -0.2599449157714844, -0.24672698974609375, -0.23350906372070312, -0.2202911376953125, -0.20707321166992188, -0.19385528564453125, -0.18063735961914062, -0.16741943359375, -0.15420150756835938, -0.14098358154296875, -0.12776565551757812, -0.1145477294921875, -0.10132980346679688, -0.08811187744140625, -0.07489395141601562, -0.061676025390625, -0.048458099365234375, -0.03524017333984375, -0.022022247314453125, -0.0088043212890625, 0.004413604736328125, 0.01763153076171875, 0.030849456787109375, 0.0440673828125, 0.057285308837890625, 0.07050323486328125, 0.08372116088867188, 0.0969390869140625, 0.11015701293945312, 0.12337493896484375, 0.13659286499023438, 0.149810791015625, 0.16302871704101562, 0.17624664306640625, 0.18946456909179688, 0.2026824951171875, 0.21590042114257812, 0.22911834716796875, 0.24233627319335938, 0.25555419921875, 0.2687721252441406, 0.28199005126953125, 0.2952079772949219, 0.3084259033203125, 0.3216438293457031, 0.33486175537109375, 0.3480796813964844, 0.361297607421875, 0.3745155334472656, 0.38773345947265625, 0.4009513854980469, 0.4141693115234375, 0.4273872375488281, 0.44060516357421875, 0.4538230895996094, 0.467041015625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 8.0, 8.0, 19.0, 51.0, 89.0, 150.0, 230.0, 204.0, 121.0, 71.0, 34.0, 15.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.65155291557312, -3.2425835132598877, -2.8336143493652344, -2.424644947052002, -2.0156755447387695, -1.606706142425537, -1.1977369785308838, -0.7887675762176514, -0.37979817390441895, 0.0291711688041687, 0.43814051151275635, 0.8471097946166992, 1.2560791969299316, 1.665048599243164, 2.0740177631378174, 2.48298716545105, 2.8919565677642822, 3.3009259700775146, 3.709895133972168, 4.1188645362854, 4.527833938598633, 4.936803340911865, 5.345772743225098, 5.754741668701172, 6.1637115478515625, 6.572680950164795, 6.981650352478027, 7.390619277954102, 7.799589157104492, 8.208558082580566, 8.61752700805664, 9.026496887207031, 9.435466766357422, 9.844435691833496, 10.253405570983887, 10.662374496459961, 11.071344375610352, 11.480313301086426, 11.8892822265625, 12.29825210571289, 12.707221984863281, 13.116190910339355, 13.525160789489746, 13.93412971496582, 14.343099594116211, 14.752068519592285, 15.16103744506836, 15.57000732421875, 15.978976249694824, 16.3879451751709, 16.79691505432129, 17.20588493347168, 17.614852905273438, 18.023822784423828, 18.43279266357422, 18.84176254272461, 19.250730514526367, 19.659700393676758, 20.068668365478516, 20.477638244628906, 20.886608123779297, 21.295578002929688, 21.704545974731445, 22.113515853881836, 22.522485733032227]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 7.0, 11.0, 13.0, 21.0, 21.0, 18.0, 35.0, 26.0, 36.0, 33.0, 47.0, 37.0, 52.0, 51.0, 43.0, 54.0, 57.0, 53.0, 47.0, 50.0, 39.0, 56.0, 33.0, 28.0, 29.0, 27.0, 17.0, 12.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.408663272857666, -6.17978572845459, -5.9509077072143555, -5.722030162811279, -5.493152141571045, -5.264274597167969, -5.035396575927734, -4.806519031524658, -4.577641487121582, -4.348763942718506, -4.1198859214782715, -3.8910083770751953, -3.662130355834961, -3.4332528114318848, -3.2043750286102295, -2.975497245788574, -2.74661922454834, -2.5177414417266846, -2.2888636589050293, -2.059986114501953, -1.8311082124710083, -1.602230429649353, -1.3733527660369873, -1.144474983215332, -0.9155972003936768, -0.6867194175720215, -0.457841694355011, -0.2289639711380005, -8.618831634521484e-05, 0.22879159450531006, 0.4576692581176758, 0.686547040939331, 0.9154243469238281, 1.1443021297454834, 1.3731799125671387, 1.6020575761795044, 1.8309353590011597, 2.0598130226135254, 2.2886908054351807, 2.517568588256836, 2.746446371078491, 2.9753241539001465, 3.2042019367218018, 3.433079719543457, 3.661957263946533, 3.8908352851867676, 4.119712829589844, 4.348590850830078, 4.577468395233154, 4.8063459396362305, 5.035223960876465, 5.264101505279541, 5.492979526519775, 5.721857070922852, 5.950735092163086, 6.179612636566162, 6.408490180969238, 6.6373677253723145, 6.866245746612549, 7.095123291015625, 7.324001312255859, 7.5528788566589355, 7.781756401062012, 8.010634422302246, 8.23951244354248]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 6.0, 12.0, 18.0, 30.0, 35.0, 76.0, 137.0, 234.0, 414.0, 904.0, 1858.0, 4596.0, 12862.0, 49524.0, 326270.0, 2033071.0, 1489402.0, 220295.0, 36977.0, 10580.0, 3792.0, 1660.0, 761.0, 356.0, 172.0, 93.0, 60.0, 31.0, 18.0, 13.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.900390625, -2.779022216796875, -2.65765380859375, -2.536285400390625, -2.4149169921875, -2.293548583984375, -2.17218017578125, -2.050811767578125, -1.929443359375, -1.808074951171875, -1.68670654296875, -1.565338134765625, -1.4439697265625, -1.322601318359375, -1.20123291015625, -1.079864501953125, -0.95849609375, -0.837127685546875, -0.71575927734375, -0.594390869140625, -0.4730224609375, -0.351654052734375, -0.23028564453125, -0.108917236328125, 0.012451171875, 0.133819580078125, 0.25518798828125, 0.376556396484375, 0.4979248046875, 0.619293212890625, 0.74066162109375, 0.862030029296875, 0.9833984375, 1.104766845703125, 1.22613525390625, 1.347503662109375, 1.4688720703125, 1.590240478515625, 1.71160888671875, 1.832977294921875, 1.954345703125, 2.075714111328125, 2.19708251953125, 2.318450927734375, 2.4398193359375, 2.561187744140625, 2.68255615234375, 2.803924560546875, 2.92529296875, 3.046661376953125, 3.16802978515625, 3.289398193359375, 3.4107666015625, 3.532135009765625, 3.65350341796875, 3.774871826171875, 3.896240234375, 4.017608642578125, 4.13897705078125, 4.260345458984375, 4.3817138671875, 4.503082275390625, 4.62445068359375, 4.745819091796875, 4.8671875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 13.0, 13.0, 17.0, 19.0, 21.0, 34.0, 44.0, 39.0, 34.0, 60.0, 60.0, 56.0, 58.0, 54.0, 68.0, 65.0, 53.0, 51.0, 51.0, 46.0, 33.0, 20.0, 16.0, 11.0, 12.0, 8.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.286590576171875, -3.17279052734375, -3.058990478515625, -2.9451904296875, -2.831390380859375, -2.71759033203125, -2.603790283203125, -2.489990234375, -2.376190185546875, -2.26239013671875, -2.148590087890625, -2.0347900390625, -1.920989990234375, -1.80718994140625, -1.693389892578125, -1.57958984375, -1.465789794921875, -1.35198974609375, -1.238189697265625, -1.1243896484375, -1.010589599609375, -0.89678955078125, -0.782989501953125, -0.669189453125, -0.555389404296875, -0.44158935546875, -0.327789306640625, -0.2139892578125, -0.100189208984375, 0.01361083984375, 0.127410888671875, 0.2412109375, 0.355010986328125, 0.46881103515625, 0.582611083984375, 0.6964111328125, 0.810211181640625, 0.92401123046875, 1.037811279296875, 1.151611328125, 1.265411376953125, 1.37921142578125, 1.493011474609375, 1.6068115234375, 1.720611572265625, 1.83441162109375, 1.948211669921875, 2.06201171875, 2.175811767578125, 2.28961181640625, 2.403411865234375, 2.5172119140625, 2.631011962890625, 2.74481201171875, 2.858612060546875, 2.972412109375, 3.086212158203125, 3.20001220703125, 3.313812255859375, 3.4276123046875, 3.541412353515625, 3.65521240234375, 3.769012451171875, 3.8828125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [4.0, 3.0, 7.0, 17.0, 51.0, 184.0, 797.0, 10090.0, 4155691.0, 26203.0, 947.0, 183.0, 80.0, 29.0, 7.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6796875, -5.0181884765625, -4.356689453125, -3.6951904296875, -3.03369140625, -2.3721923828125, -1.710693359375, -1.0491943359375, -0.3876953125, 0.2738037109375, 0.935302734375, 1.5968017578125, 2.25830078125, 2.9197998046875, 3.581298828125, 4.2427978515625, 4.904296875, 5.5657958984375, 6.227294921875, 6.8887939453125, 7.55029296875, 8.2117919921875, 8.873291015625, 9.5347900390625, 10.1962890625, 10.8577880859375, 11.519287109375, 12.1807861328125, 12.84228515625, 13.5037841796875, 14.165283203125, 14.8267822265625, 15.48828125, 16.1497802734375, 16.811279296875, 17.4727783203125, 18.13427734375, 18.7957763671875, 19.457275390625, 20.1187744140625, 20.7802734375, 21.4417724609375, 22.103271484375, 22.7647705078125, 23.42626953125, 24.0877685546875, 24.749267578125, 25.4107666015625, 26.072265625, 26.7337646484375, 27.395263671875, 28.0567626953125, 28.71826171875, 29.3797607421875, 30.041259765625, 30.7027587890625, 31.3642578125, 32.0257568359375, 32.687255859375, 33.3487548828125, 34.01025390625, 34.6717529296875, 35.333251953125, 35.9947509765625, 36.65625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 18.0, 24.0, 45.0, 47.0, 67.0, 142.0, 236.0, 429.0, 806.0, 942.0, 625.0, 295.0, 155.0, 101.0, 53.0, 34.0, 17.0, 11.0, 8.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2734375, -2.2154388427734375, -2.157440185546875, -2.0994415283203125, -2.04144287109375, -1.9834442138671875, -1.925445556640625, -1.8674468994140625, -1.8094482421875, -1.7514495849609375, -1.693450927734375, -1.6354522705078125, -1.57745361328125, -1.5194549560546875, -1.461456298828125, -1.4034576416015625, -1.345458984375, -1.2874603271484375, -1.229461669921875, -1.1714630126953125, -1.11346435546875, -1.0554656982421875, -0.997467041015625, -0.9394683837890625, -0.8814697265625, -0.8234710693359375, -0.765472412109375, -0.7074737548828125, -0.64947509765625, -0.5914764404296875, -0.533477783203125, -0.4754791259765625, -0.41748046875, -0.3594818115234375, -0.301483154296875, -0.2434844970703125, -0.18548583984375, -0.1274871826171875, -0.069488525390625, -0.0114898681640625, 0.0465087890625, 0.1045074462890625, 0.162506103515625, 0.2205047607421875, 0.27850341796875, 0.3365020751953125, 0.394500732421875, 0.4524993896484375, 0.510498046875, 0.5684967041015625, 0.626495361328125, 0.6844940185546875, 0.74249267578125, 0.8004913330078125, 0.858489990234375, 0.9164886474609375, 0.9744873046875, 1.0324859619140625, 1.090484619140625, 1.1484832763671875, 1.20648193359375, 1.2644805908203125, 1.322479248046875, 1.3804779052734375, 1.4384765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 7.0, 13.0, 16.0, 22.0, 22.0, 29.0, 46.0, 58.0, 68.0, 76.0, 91.0, 95.0, 87.0, 98.0, 65.0, 58.0, 43.0, 21.0, 19.0, 22.0, 12.0, 10.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.605706691741943, -5.464009761810303, -5.322312355041504, -5.180615425109863, -5.038918495178223, -4.897221088409424, -4.755524158477783, -4.613826751708984, -4.472129821777344, -4.330432891845703, -4.188735485076904, -4.047038555145264, -3.905341386795044, -3.763644218444824, -3.6219472885131836, -3.480250120162964, -3.338552951812744, -3.1968557834625244, -3.0551586151123047, -2.913461685180664, -2.7717645168304443, -2.6300673484802246, -2.488370418548584, -2.3466732501983643, -2.2049760818481445, -2.063278913497925, -1.9215818643569946, -1.7798848152160645, -1.6381876468658447, -1.496490478515625, -1.3547934293746948, -1.2130963802337646, -1.071399211883545, -0.92970210313797, -0.788004994392395, -0.6463078856468201, -0.5046107769012451, -0.36291366815567017, -0.22121655941009521, -0.07951945066452026, 0.06217765808105469, 0.20387476682662964, 0.3455718755722046, 0.48726898431777954, 0.6289660930633545, 0.7706632018089294, 0.9123603105545044, 1.0540573596954346, 1.1957545280456543, 1.337451696395874, 1.4791487455368042, 1.6208457946777344, 1.762542963027954, 1.9042401313781738, 2.0459370613098145, 2.187634229660034, 2.329331398010254, 2.4710285663604736, 2.6127257347106934, 2.754422664642334, 2.8961198329925537, 3.0378170013427734, 3.179513931274414, 3.321211099624634, 3.4629082679748535]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 10.0, 3.0, 8.0, 17.0, 22.0, 14.0, 16.0, 33.0, 22.0, 34.0, 46.0, 43.0, 29.0, 38.0, 59.0, 42.0, 49.0, 47.0, 59.0, 47.0, 55.0, 45.0, 48.0, 36.0, 29.0, 22.0, 17.0, 27.0, 21.0, 12.0, 9.0, 9.0, 5.0, 5.0, 7.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.914206027984619, -2.811676502227783, -2.7091469764709473, -2.6066174507141113, -2.5040876865386963, -2.4015581607818604, -2.2990286350250244, -2.1964991092681885, -2.0939693450927734, -1.9914398193359375, -1.888910174369812, -1.786380648612976, -1.6838510036468506, -1.5813214778900146, -1.4787919521331787, -1.3762624263763428, -1.2737329006195068, -1.171203374862671, -1.0686737298965454, -0.9661442041397095, -0.8636146187782288, -0.761085033416748, -0.6585555076599121, -0.5560259222984314, -0.4534963369369507, -0.35096675157546997, -0.24843719601631165, -0.14590764045715332, -0.04337805509567261, 0.059151530265808105, 0.16168105602264404, 0.26421064138412476, 0.36674046516418457, 0.4692700505256653, 0.571799635887146, 0.6743291616439819, 0.7768587470054626, 0.8793883323669434, 0.9819178581237793, 1.0844473838806152, 1.1869770288467407, 1.2895065546035767, 1.3920361995697021, 1.494565725326538, 1.597095251083374, 1.6996248960494995, 1.8021544218063354, 1.904684066772461, 2.007213592529297, 2.109743118286133, 2.2122726440429688, 2.3148021697998047, 2.4173319339752197, 2.5198614597320557, 2.6223909854888916, 2.7249205112457275, 2.8274502754211426, 2.9299798011779785, 3.0325093269348145, 3.1350388526916504, 3.2375686168670654, 3.3400981426239014, 3.4426276683807373, 3.5451571941375732, 3.647686719894409]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 14.0, 15.0, 21.0, 31.0, 41.0, 78.0, 106.0, 140.0, 203.0, 319.0, 469.0, 720.0, 1267.0, 2079.0, 3513.0, 6143.0, 11999.0, 24165.0, 55152.0, 148756.0, 417087.0, 231591.0, 77988.0, 32414.0, 15391.0, 7811.0, 4261.0, 2514.0, 1525.0, 943.0, 571.0, 402.0, 264.0, 155.0, 115.0, 69.0, 61.0, 42.0, 32.0, 27.0, 14.0, 10.0, 8.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36083984375, -0.3494529724121094, -0.33806610107421875, -0.3266792297363281, -0.3152923583984375, -0.3039054870605469, -0.29251861572265625, -0.2811317443847656, -0.269744873046875, -0.2583580017089844, -0.24697113037109375, -0.23558425903320312, -0.2241973876953125, -0.21281051635742188, -0.20142364501953125, -0.19003677368164062, -0.17864990234375, -0.16726303100585938, -0.15587615966796875, -0.14448928833007812, -0.1331024169921875, -0.12171554565429688, -0.11032867431640625, -0.09894180297851562, -0.087554931640625, -0.07616806030273438, -0.06478118896484375, -0.053394317626953125, -0.0420074462890625, -0.030620574951171875, -0.01923370361328125, -0.007846832275390625, 0.0035400390625, 0.014926910400390625, 0.02631378173828125, 0.037700653076171875, 0.0490875244140625, 0.060474395751953125, 0.07186126708984375, 0.08324813842773438, 0.094635009765625, 0.10602188110351562, 0.11740875244140625, 0.12879562377929688, 0.1401824951171875, 0.15156936645507812, 0.16295623779296875, 0.17434310913085938, 0.18572998046875, 0.19711685180664062, 0.20850372314453125, 0.21989059448242188, 0.2312774658203125, 0.24266433715820312, 0.25405120849609375, 0.2654380798339844, 0.276824951171875, 0.2882118225097656, 0.29959869384765625, 0.3109855651855469, 0.3223724365234375, 0.3337593078613281, 0.34514617919921875, 0.3565330505371094, 0.367919921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 8.0, 1.0, 4.0, 4.0, 11.0, 10.0, 17.0, 19.0, 26.0, 27.0, 25.0, 33.0, 51.0, 48.0, 41.0, 37.0, 60.0, 52.0, 57.0, 63.0, 54.0, 56.0, 51.0, 48.0, 32.0, 36.0, 35.0, 26.0, 21.0, 15.0, 8.0, 9.0, 4.0, 1.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.28021240234375, -2.2069091796875, -2.13360595703125, -2.060302734375, -1.98699951171875, -1.9136962890625, -1.84039306640625, -1.76708984375, -1.69378662109375, -1.6204833984375, -1.54718017578125, -1.473876953125, -1.40057373046875, -1.3272705078125, -1.25396728515625, -1.1806640625, -1.10736083984375, -1.0340576171875, -0.96075439453125, -0.887451171875, -0.81414794921875, -0.7408447265625, -0.66754150390625, -0.59423828125, -0.52093505859375, -0.4476318359375, -0.37432861328125, -0.301025390625, -0.22772216796875, -0.1544189453125, -0.08111572265625, -0.0078125, 0.06549072265625, 0.1387939453125, 0.21209716796875, 0.285400390625, 0.35870361328125, 0.4320068359375, 0.50531005859375, 0.57861328125, 0.65191650390625, 0.7252197265625, 0.79852294921875, 0.871826171875, 0.94512939453125, 1.0184326171875, 1.09173583984375, 1.1650390625, 1.23834228515625, 1.3116455078125, 1.38494873046875, 1.458251953125, 1.53155517578125, 1.6048583984375, 1.67816162109375, 1.75146484375, 1.82476806640625, 1.8980712890625, 1.97137451171875, 2.044677734375, 2.11798095703125, 2.1912841796875, 2.26458740234375, 2.337890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 7.0, 8.0, 12.0, 19.0, 15.0, 39.0, 36.0, 67.0, 72.0, 119.0, 202.0, 301.0, 486.0, 745.0, 1205.0, 1848.0, 3113.0, 4994.0, 8485.0, 14834.0, 27035.0, 51995.0, 107687.0, 240231.0, 296926.0, 141787.0, 66726.0, 34147.0, 18599.0, 10586.0, 6416.0, 3790.0, 2281.0, 1360.0, 842.0, 575.0, 336.0, 211.0, 151.0, 96.0, 48.0, 44.0, 31.0, 16.0, 18.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1900634765625, -0.1833171844482422, -0.17657089233398438, -0.16982460021972656, -0.16307830810546875, -0.15633201599121094, -0.14958572387695312, -0.1428394317626953, -0.1360931396484375, -0.1293468475341797, -0.12260055541992188, -0.11585426330566406, -0.10910797119140625, -0.10236167907714844, -0.09561538696289062, -0.08886909484863281, -0.082122802734375, -0.07537651062011719, -0.06863021850585938, -0.06188392639160156, -0.05513763427734375, -0.04839134216308594, -0.041645050048828125, -0.03489875793457031, -0.0281524658203125, -0.021406173706054688, -0.014659881591796875, -0.007913589477539062, -0.00116729736328125, 0.0055789947509765625, 0.012325286865234375, 0.019071578979492188, 0.02581787109375, 0.03256416320800781, 0.039310455322265625, 0.04605674743652344, 0.05280303955078125, 0.05954933166503906, 0.06629562377929688, 0.07304191589355469, 0.0797882080078125, 0.08653450012207031, 0.09328079223632812, 0.10002708435058594, 0.10677337646484375, 0.11351966857910156, 0.12026596069335938, 0.1270122528076172, 0.133758544921875, 0.1405048370361328, 0.14725112915039062, 0.15399742126464844, 0.16074371337890625, 0.16749000549316406, 0.17423629760742188, 0.1809825897216797, 0.1877288818359375, 0.1944751739501953, 0.20122146606445312, 0.20796775817871094, 0.21471405029296875, 0.22146034240722656, 0.22820663452148438, 0.2349529266357422, 0.24169921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 3.0, 12.0, 7.0, 9.0, 11.0, 8.0, 11.0, 16.0, 15.0, 19.0, 28.0, 29.0, 34.0, 29.0, 36.0, 33.0, 29.0, 29.0, 39.0, 33.0, 45.0, 51.0, 35.0, 56.0, 44.0, 37.0, 42.0, 35.0, 46.0, 32.0, 21.0, 19.0, 23.0, 15.0, 13.0, 12.0, 13.0, 13.0, 5.0, 1.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5625, -3.4384765625, -3.314453125, -3.1904296875, -3.06640625, -2.9423828125, -2.818359375, -2.6943359375, -2.5703125, -2.4462890625, -2.322265625, -2.1982421875, -2.07421875, -1.9501953125, -1.826171875, -1.7021484375, -1.578125, -1.4541015625, -1.330078125, -1.2060546875, -1.08203125, -0.9580078125, -0.833984375, -0.7099609375, -0.5859375, -0.4619140625, -0.337890625, -0.2138671875, -0.08984375, 0.0341796875, 0.158203125, 0.2822265625, 0.40625, 0.5302734375, 0.654296875, 0.7783203125, 0.90234375, 1.0263671875, 1.150390625, 1.2744140625, 1.3984375, 1.5224609375, 1.646484375, 1.7705078125, 1.89453125, 2.0185546875, 2.142578125, 2.2666015625, 2.390625, 2.5146484375, 2.638671875, 2.7626953125, 2.88671875, 3.0107421875, 3.134765625, 3.2587890625, 3.3828125, 3.5068359375, 3.630859375, 3.7548828125, 3.87890625, 4.0029296875, 4.126953125, 4.2509765625, 4.375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 18.0, 29.0, 38.0, 65.0, 111.0, 172.0, 261.0, 487.0, 910.0, 1851.0, 4970.0, 19945.0, 278311.0, 700155.0, 30931.0, 6095.0, 2105.0, 890.0, 462.0, 247.0, 158.0, 100.0, 73.0, 43.0, 30.0, 19.0, 12.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.110107421875, -0.10667991638183594, -0.10325241088867188, -0.09982490539550781, -0.09639739990234375, -0.09296989440917969, -0.08954238891601562, -0.08611488342285156, -0.0826873779296875, -0.07925987243652344, -0.07583236694335938, -0.07240486145019531, -0.06897735595703125, -0.06554985046386719, -0.062122344970703125, -0.05869483947753906, -0.055267333984375, -0.05183982849121094, -0.048412322998046875, -0.04498481750488281, -0.04155731201171875, -0.03812980651855469, -0.034702301025390625, -0.03127479553222656, -0.0278472900390625, -0.024419784545898438, -0.020992279052734375, -0.017564773559570312, -0.01413726806640625, -0.010709762573242188, -0.007282257080078125, -0.0038547515869140625, -0.00042724609375, 0.0030002593994140625, 0.006427764892578125, 0.009855270385742188, 0.01328277587890625, 0.016710281372070312, 0.020137786865234375, 0.023565292358398438, 0.0269927978515625, 0.030420303344726562, 0.033847808837890625, 0.03727531433105469, 0.04070281982421875, 0.04413032531738281, 0.047557830810546875, 0.05098533630371094, 0.054412841796875, 0.05784034729003906, 0.061267852783203125, 0.06469535827636719, 0.06812286376953125, 0.07155036926269531, 0.07497787475585938, 0.07840538024902344, 0.0818328857421875, 0.08526039123535156, 0.08868789672851562, 0.09211540222167969, 0.09554290771484375, 0.09897041320800781, 0.10239791870117188, 0.10582542419433594, 0.1092529296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 11.0, 11.0, 15.0, 36.0, 43.0, 105.0, 104.0, 179.0, 161.0, 134.0, 70.0, 50.0, 28.0, 22.0, 16.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.253885269165039e-05, -7.012765854597092e-05, -6.771646440029144e-05, -6.530527025461197e-05, -6.28940761089325e-05, -6.048288196325302e-05, -5.807168781757355e-05, -5.5660493671894073e-05, -5.32492995262146e-05, -5.0838105380535126e-05, -4.842691123485565e-05, -4.601571708917618e-05, -4.3604522943496704e-05, -4.119332879781723e-05, -3.8782134652137756e-05, -3.637094050645828e-05, -3.395974636077881e-05, -3.1548552215099335e-05, -2.913735806941986e-05, -2.6726163923740387e-05, -2.4314969778060913e-05, -2.190377563238144e-05, -1.9492581486701965e-05, -1.708138734102249e-05, -1.4670193195343018e-05, -1.2258999049663544e-05, -9.84780490398407e-06, -7.436610758304596e-06, -5.025416612625122e-06, -2.614222466945648e-06, -2.0302832126617432e-07, 2.2081658244132996e-06, 4.6193599700927734e-06, 7.030554115772247e-06, 9.441748261451721e-06, 1.1852942407131195e-05, 1.4264136552810669e-05, 1.6675330698490143e-05, 1.9086524844169617e-05, 2.149771898984909e-05, 2.3908913135528564e-05, 2.632010728120804e-05, 2.8731301426887512e-05, 3.1142495572566986e-05, 3.355368971824646e-05, 3.5964883863925934e-05, 3.837607800960541e-05, 4.078727215528488e-05, 4.3198466300964355e-05, 4.560966044664383e-05, 4.80208545923233e-05, 5.043204873800278e-05, 5.284324288368225e-05, 5.5254437029361725e-05, 5.76656311750412e-05, 6.007682532072067e-05, 6.248801946640015e-05, 6.489921361207962e-05, 6.73104077577591e-05, 6.972160190343857e-05, 7.213279604911804e-05, 7.454399019479752e-05, 7.695518434047699e-05, 7.936637848615646e-05, 8.177757263183594e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 2.0, 5.0, 4.0, 12.0, 28.0, 49.0, 82.0, 207.0, 496.0, 1303.0, 4371.0, 19893.0, 353567.0, 636513.0, 24717.0, 4941.0, 1483.0, 491.0, 196.0, 83.0, 46.0, 17.0, 11.0, 6.0, 9.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.1457233428955078, -0.14117813110351562, -0.13663291931152344, -0.13208770751953125, -0.12754249572753906, -0.12299728393554688, -0.11845207214355469, -0.1139068603515625, -0.10936164855957031, -0.10481643676757812, -0.10027122497558594, -0.09572601318359375, -0.09118080139160156, -0.08663558959960938, -0.08209037780761719, -0.077545166015625, -0.07299995422363281, -0.06845474243164062, -0.06390953063964844, -0.05936431884765625, -0.05481910705566406, -0.050273895263671875, -0.04572868347167969, -0.0411834716796875, -0.03663825988769531, -0.032093048095703125, -0.027547836303710938, -0.02300262451171875, -0.018457412719726562, -0.013912200927734375, -0.009366989135742188, -0.00482177734375, -0.0002765655517578125, 0.004268646240234375, 0.008813858032226562, 0.01335906982421875, 0.017904281616210938, 0.022449493408203125, 0.026994705200195312, 0.0315399169921875, 0.03608512878417969, 0.040630340576171875, 0.04517555236816406, 0.04972076416015625, 0.05426597595214844, 0.058811187744140625, 0.06335639953613281, 0.067901611328125, 0.07244682312011719, 0.07699203491210938, 0.08153724670410156, 0.08608245849609375, 0.09062767028808594, 0.09517288208007812, 0.09971809387207031, 0.1042633056640625, 0.10880851745605469, 0.11335372924804688, 0.11789894104003906, 0.12244415283203125, 0.12698936462402344, 0.13153457641601562, 0.1360797882080078, 0.140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 2.0, 4.0, 6.0, 8.0, 9.0, 9.0, 11.0, 13.0, 26.0, 28.0, 59.0, 95.0, 220.0, 234.0, 100.0, 45.0, 30.0, 20.0, 18.0, 9.0, 10.0, 5.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02569580078125, -0.02491927146911621, -0.024142742156982422, -0.023366212844848633, -0.022589683532714844, -0.021813154220581055, -0.021036624908447266, -0.020260095596313477, -0.019483566284179688, -0.0187070369720459, -0.01793050765991211, -0.01715397834777832, -0.01637744903564453, -0.015600919723510742, -0.014824390411376953, -0.014047861099243164, -0.013271331787109375, -0.012494802474975586, -0.011718273162841797, -0.010941743850708008, -0.010165214538574219, -0.00938868522644043, -0.00861215591430664, -0.007835626602172852, -0.0070590972900390625, -0.0062825679779052734, -0.005506038665771484, -0.004729509353637695, -0.003952980041503906, -0.003176450729370117, -0.002399921417236328, -0.001623392105102539, -0.00084686279296875, -7.033348083496094e-05, 0.0007061958312988281, 0.0014827251434326172, 0.0022592544555664062, 0.0030357837677001953, 0.0038123130798339844, 0.0045888423919677734, 0.0053653717041015625, 0.0061419010162353516, 0.006918430328369141, 0.00769495964050293, 0.008471488952636719, 0.009248018264770508, 0.010024547576904297, 0.010801076889038086, 0.011577606201171875, 0.012354135513305664, 0.013130664825439453, 0.013907194137573242, 0.014683723449707031, 0.01546025276184082, 0.01623678207397461, 0.0170133113861084, 0.017789840698242188, 0.018566370010375977, 0.019342899322509766, 0.020119428634643555, 0.020895957946777344, 0.021672487258911133, 0.022449016571044922, 0.02322554588317871, 0.0240020751953125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 13.0, 19.0, 44.0, 73.0, 126.0, 189.0, 209.0, 164.0, 83.0, 37.0, 25.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.971868515014648, -8.785367965698242, -8.59886646270752, -8.412365913391113, -8.22586441040039, -8.039363861083984, -7.852862358093262, -7.666361331939697, -7.479860305786133, -7.293359279632568, -7.106858253479004, -6.9203572273254395, -6.733856201171875, -6.5473551750183105, -6.360854148864746, -6.174353122711182, -5.987852096557617, -5.801351070404053, -5.614850044250488, -5.428349018096924, -5.241847991943359, -5.055346965789795, -4.8688459396362305, -4.682344913482666, -4.49584436416626, -4.309343338012695, -4.122842311859131, -3.9363412857055664, -3.749840259552002, -3.5633392333984375, -3.376838207244873, -3.1903371810913086, -3.0038363933563232, -2.817335367202759, -2.6308343410491943, -2.44433331489563, -2.2578322887420654, -2.071331262588501, -1.884830355644226, -1.6983293294906616, -1.5118283033370972, -1.3253272771835327, -1.1388262510299683, -0.9523252844810486, -0.7658242583274841, -0.5793232321739197, -0.392822265625, -0.20632123947143555, -0.019820213317871094, 0.16668079793453217, 0.3531818091869354, 0.5396828055381775, 0.7261838316917419, 0.9126848578453064, 1.099185824394226, 1.2856868505477905, 1.472187876701355, 1.6586889028549194, 1.8451899290084839, 2.031690835952759, 2.2181918621063232, 2.4046928882598877, 2.591193914413452, 2.7776949405670166, 2.964195966720581]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 2.0, 4.0, 6.0, 6.0, 8.0, 15.0, 25.0, 14.0, 30.0, 30.0, 30.0, 48.0, 48.0, 43.0, 54.0, 58.0, 53.0, 70.0, 64.0, 59.0, 65.0, 57.0, 39.0, 33.0, 25.0, 26.0, 30.0, 14.0, 12.0, 10.0, 3.0, 7.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5932490825653076, -2.5170950889587402, -2.440941095352173, -2.3647871017456055, -2.288633108139038, -2.2124791145324707, -2.1363251209259033, -2.060171127319336, -1.9840171337127686, -1.9078631401062012, -1.8317091464996338, -1.7555551528930664, -1.679401159286499, -1.6032471656799316, -1.5270931720733643, -1.4509391784667969, -1.374785304069519, -1.2986313104629517, -1.2224773168563843, -1.146323323249817, -1.0701693296432495, -0.9940153360366821, -0.9178614020347595, -0.8417074084281921, -0.7655534148216248, -0.6893994212150574, -0.61324542760849, -0.5370914936065674, -0.4609374701976776, -0.38478347659111023, -0.30862951278686523, -0.23247551918029785, -0.15632152557373047, -0.08016753941774368, -0.004013553261756897, 0.07214042544364929, 0.14829441905021667, 0.22444841265678406, 0.30060237646102905, 0.37675637006759644, 0.4529103636741638, 0.5290643572807312, 0.6052183508872986, 0.6813722848892212, 0.7575262784957886, 0.833680272102356, 0.9098342657089233, 0.9859882593154907, 1.062142252922058, 1.1382962465286255, 1.2144502401351929, 1.2906042337417603, 1.3667582273483276, 1.442912220954895, 1.5190660953521729, 1.5952200889587402, 1.6713740825653076, 1.747528076171875, 1.8236820697784424, 1.8998360633850098, 1.9759900569915771, 2.0521440505981445, 2.128298044204712, 2.2044520378112793, 2.2806060314178467]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 12.0, 9.0, 15.0, 25.0, 27.0, 67.0, 245.0, 886.0, 4543.0, 41208.0, 823710.0, 164360.0, 10968.0, 1777.0, 416.0, 150.0, 42.0, 28.0, 16.0, 7.0, 6.0, 8.0, 3.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -7.01708984375, -6.8310546875, -6.64501953125, -6.458984375, -6.27294921875, -6.0869140625, -5.90087890625, -5.71484375, -5.52880859375, -5.3427734375, -5.15673828125, -4.970703125, -4.78466796875, -4.5986328125, -4.41259765625, -4.2265625, -4.04052734375, -3.8544921875, -3.66845703125, -3.482421875, -3.29638671875, -3.1103515625, -2.92431640625, -2.73828125, -2.55224609375, -2.3662109375, -2.18017578125, -1.994140625, -1.80810546875, -1.6220703125, -1.43603515625, -1.25, -1.06396484375, -0.8779296875, -0.69189453125, -0.505859375, -0.31982421875, -0.1337890625, 0.05224609375, 0.23828125, 0.42431640625, 0.6103515625, 0.79638671875, 0.982421875, 1.16845703125, 1.3544921875, 1.54052734375, 1.7265625, 1.91259765625, 2.0986328125, 2.28466796875, 2.470703125, 2.65673828125, 2.8427734375, 3.02880859375, 3.21484375, 3.40087890625, 3.5869140625, 3.77294921875, 3.958984375, 4.14501953125, 4.3310546875, 4.51708984375, 4.703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 9.0, 8.0, 13.0, 12.0, 14.0, 29.0, 21.0, 42.0, 27.0, 56.0, 31.0, 53.0, 62.0, 52.0, 76.0, 59.0, 57.0, 62.0, 64.0, 43.0, 37.0, 36.0, 29.0, 19.0, 20.0, 13.0, 12.0, 6.0, 5.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.1171875, -4.97259521484375, -4.8280029296875, -4.68341064453125, -4.538818359375, -4.39422607421875, -4.2496337890625, -4.10504150390625, -3.96044921875, -3.81585693359375, -3.6712646484375, -3.52667236328125, -3.382080078125, -3.23748779296875, -3.0928955078125, -2.94830322265625, -2.8037109375, -2.65911865234375, -2.5145263671875, -2.36993408203125, -2.225341796875, -2.08074951171875, -1.9361572265625, -1.79156494140625, -1.64697265625, -1.50238037109375, -1.3577880859375, -1.21319580078125, -1.068603515625, -0.92401123046875, -0.7794189453125, -0.63482666015625, -0.490234375, -0.34564208984375, -0.2010498046875, -0.05645751953125, 0.088134765625, 0.23272705078125, 0.3773193359375, 0.52191162109375, 0.66650390625, 0.81109619140625, 0.9556884765625, 1.10028076171875, 1.244873046875, 1.38946533203125, 1.5340576171875, 1.67864990234375, 1.8232421875, 1.96783447265625, 2.1124267578125, 2.25701904296875, 2.401611328125, 2.54620361328125, 2.6907958984375, 2.83538818359375, 2.97998046875, 3.12457275390625, 3.2691650390625, 3.41375732421875, 3.558349609375, 3.70294189453125, 3.8475341796875, 3.99212646484375, 4.13671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 5.0, 13.0, 8.0, 9.0, 19.0, 13.0, 11.0, 20.0, 18.0, 29.0, 34.0, 40.0, 38.0, 74.0, 96.0, 149.0, 253.0, 591.0, 1599.0, 5227.0, 29673.0, 513612.0, 461795.0, 27605.0, 4931.0, 1359.0, 508.0, 241.0, 156.0, 111.0, 59.0, 40.0, 33.0, 29.0, 27.0, 22.0, 13.0, 12.0, 13.0, 10.0, 14.0, 9.0, 6.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0], "bins": [-4.484375, -4.3524169921875, -4.220458984375, -4.0885009765625, -3.95654296875, -3.8245849609375, -3.692626953125, -3.5606689453125, -3.4287109375, -3.2967529296875, -3.164794921875, -3.0328369140625, -2.90087890625, -2.7689208984375, -2.636962890625, -2.5050048828125, -2.373046875, -2.2410888671875, -2.109130859375, -1.9771728515625, -1.84521484375, -1.7132568359375, -1.581298828125, -1.4493408203125, -1.3173828125, -1.1854248046875, -1.053466796875, -0.9215087890625, -0.78955078125, -0.6575927734375, -0.525634765625, -0.3936767578125, -0.26171875, -0.1297607421875, 0.002197265625, 0.1341552734375, 0.26611328125, 0.3980712890625, 0.530029296875, 0.6619873046875, 0.7939453125, 0.9259033203125, 1.057861328125, 1.1898193359375, 1.32177734375, 1.4537353515625, 1.585693359375, 1.7176513671875, 1.849609375, 1.9815673828125, 2.113525390625, 2.2454833984375, 2.37744140625, 2.5093994140625, 2.641357421875, 2.7733154296875, 2.9052734375, 3.0372314453125, 3.169189453125, 3.3011474609375, 3.43310546875, 3.5650634765625, 3.697021484375, 3.8289794921875, 3.9609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 7.0, 10.0, 15.0, 20.0, 12.0, 14.0, 13.0, 10.0, 23.0, 26.0, 25.0, 34.0, 32.0, 26.0, 54.0, 32.0, 36.0, 39.0, 47.0, 41.0, 42.0, 38.0, 45.0, 36.0, 31.0, 28.0, 39.0, 31.0, 18.0, 25.0, 18.0, 15.0, 16.0, 17.0, 12.0, 14.0, 12.0, 11.0, 9.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.00390625, -3.88287353515625, -3.7618408203125, -3.64080810546875, -3.519775390625, -3.39874267578125, -3.2777099609375, -3.15667724609375, -3.03564453125, -2.91461181640625, -2.7935791015625, -2.67254638671875, -2.551513671875, -2.43048095703125, -2.3094482421875, -2.18841552734375, -2.0673828125, -1.94635009765625, -1.8253173828125, -1.70428466796875, -1.583251953125, -1.46221923828125, -1.3411865234375, -1.22015380859375, -1.09912109375, -0.97808837890625, -0.8570556640625, -0.73602294921875, -0.614990234375, -0.49395751953125, -0.3729248046875, -0.25189208984375, -0.130859375, -0.00982666015625, 0.1112060546875, 0.23223876953125, 0.353271484375, 0.47430419921875, 0.5953369140625, 0.71636962890625, 0.83740234375, 0.95843505859375, 1.0794677734375, 1.20050048828125, 1.321533203125, 1.44256591796875, 1.5635986328125, 1.68463134765625, 1.8056640625, 1.92669677734375, 2.0477294921875, 2.16876220703125, 2.289794921875, 2.41082763671875, 2.5318603515625, 2.65289306640625, 2.77392578125, 2.89495849609375, 3.0159912109375, 3.13702392578125, 3.258056640625, 3.37908935546875, 3.5001220703125, 3.62115478515625, 3.7421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 5.0, 7.0, 7.0, 18.0, 17.0, 19.0, 35.0, 73.0, 101.0, 116.0, 212.0, 413.0, 705.0, 1459.0, 3389.0, 9018.0, 30114.0, 134329.0, 589162.0, 214584.0, 44496.0, 12171.0, 4257.0, 1801.0, 901.0, 442.0, 252.0, 145.0, 111.0, 61.0, 39.0, 28.0, 18.0, 13.0, 7.0, 5.0, 2.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.861328125, -0.8349380493164062, -0.8085479736328125, -0.7821578979492188, -0.755767822265625, -0.7293777465820312, -0.7029876708984375, -0.6765975952148438, -0.65020751953125, -0.6238174438476562, -0.5974273681640625, -0.5710372924804688, -0.544647216796875, -0.5182571411132812, -0.4918670654296875, -0.46547698974609375, -0.4390869140625, -0.41269683837890625, -0.3863067626953125, -0.35991668701171875, -0.333526611328125, -0.30713653564453125, -0.2807464599609375, -0.25435638427734375, -0.22796630859375, -0.20157623291015625, -0.1751861572265625, -0.14879608154296875, -0.122406005859375, -0.09601593017578125, -0.0696258544921875, -0.04323577880859375, -0.016845703125, 0.00954437255859375, 0.0359344482421875, 0.06232452392578125, 0.088714599609375, 0.11510467529296875, 0.1414947509765625, 0.16788482666015625, 0.19427490234375, 0.22066497802734375, 0.2470550537109375, 0.27344512939453125, 0.299835205078125, 0.32622528076171875, 0.3526153564453125, 0.37900543212890625, 0.4053955078125, 0.43178558349609375, 0.4581756591796875, 0.48456573486328125, 0.510955810546875, 0.5373458862304688, 0.5637359619140625, 0.5901260375976562, 0.61651611328125, 0.6429061889648438, 0.6692962646484375, 0.6956863403320312, 0.722076416015625, 0.7484664916992188, 0.7748565673828125, 0.8012466430664062, 0.82763671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 10.0, 8.0, 9.0, 8.0, 12.0, 23.0, 32.0, 25.0, 45.0, 51.0, 76.0, 84.0, 123.0, 109.0, 96.0, 65.0, 42.0, 45.0, 32.0, 20.0, 17.0, 11.0, 14.0, 9.0, 5.0, 3.0, 8.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00011426210403442383, -0.00011021923273801804, -0.00010617636144161224, -0.00010213349014520645, -9.809061884880066e-05, -9.404774755239487e-05, -9.000487625598907e-05, -8.596200495958328e-05, -8.191913366317749e-05, -7.78762623667717e-05, -7.38333910703659e-05, -6.979051977396011e-05, -6.574764847755432e-05, -6.170477718114853e-05, -5.766190588474274e-05, -5.3619034588336945e-05, -4.957616329193115e-05, -4.553329199552536e-05, -4.149042069911957e-05, -3.7447549402713776e-05, -3.3404678106307983e-05, -2.936180680990219e-05, -2.53189355134964e-05, -2.1276064217090607e-05, -1.7233192920684814e-05, -1.3190321624279022e-05, -9.14745032787323e-06, -5.104579031467438e-06, -1.0617077350616455e-06, 2.9811635613441467e-06, 7.024034857749939e-06, 1.1066906154155731e-05, 1.5109777450561523e-05, 1.9152648746967316e-05, 2.3195520043373108e-05, 2.72383913397789e-05, 3.128126263618469e-05, 3.5324133932590485e-05, 3.936700522899628e-05, 4.340987652540207e-05, 4.745274782180786e-05, 5.1495619118213654e-05, 5.5538490414619446e-05, 5.958136171102524e-05, 6.362423300743103e-05, 6.766710430383682e-05, 7.170997560024261e-05, 7.575284689664841e-05, 7.97957181930542e-05, 8.383858948945999e-05, 8.788146078586578e-05, 9.192433208227158e-05, 9.596720337867737e-05, 0.00010001007467508316, 0.00010405294597148895, 0.00010809581726789474, 0.00011213868856430054, 0.00011618155986070633, 0.00012022443115711212, 0.00012426730245351791, 0.0001283101737499237, 0.0001323530450463295, 0.0001363959163427353, 0.00014043878763914108, 0.00014448165893554688]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 9.0, 17.0, 23.0, 36.0, 41.0, 67.0, 100.0, 165.0, 266.0, 460.0, 865.0, 1846.0, 4270.0, 11876.0, 46039.0, 269260.0, 584640.0, 95962.0, 20778.0, 6414.0, 2636.0, 1216.0, 558.0, 351.0, 229.0, 134.0, 89.0, 46.0, 45.0, 28.0, 14.0, 9.0, 10.0, 6.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.0546875, -1.0229415893554688, -0.9911956787109375, -0.9594497680664062, -0.927703857421875, -0.8959579467773438, -0.8642120361328125, -0.8324661254882812, -0.80072021484375, -0.7689743041992188, -0.7372283935546875, -0.7054824829101562, -0.673736572265625, -0.6419906616210938, -0.6102447509765625, -0.5784988403320312, -0.5467529296875, -0.5150070190429688, -0.4832611083984375, -0.45151519775390625, -0.419769287109375, -0.38802337646484375, -0.3562774658203125, -0.32453155517578125, -0.29278564453125, -0.26103973388671875, -0.2292938232421875, -0.19754791259765625, -0.165802001953125, -0.13405609130859375, -0.1023101806640625, -0.07056427001953125, -0.038818359375, -0.00707244873046875, 0.0246734619140625, 0.05641937255859375, 0.088165283203125, 0.11991119384765625, 0.1516571044921875, 0.18340301513671875, 0.21514892578125, 0.24689483642578125, 0.2786407470703125, 0.31038665771484375, 0.342132568359375, 0.37387847900390625, 0.4056243896484375, 0.43737030029296875, 0.4691162109375, 0.5008621215820312, 0.5326080322265625, 0.5643539428710938, 0.596099853515625, 0.6278457641601562, 0.6595916748046875, 0.6913375854492188, 0.72308349609375, 0.7548294067382812, 0.7865753173828125, 0.8183212280273438, 0.850067138671875, 0.8818130493164062, 0.9135589599609375, 0.9453048706054688, 0.97705078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 1.0, 2.0, 3.0, 7.0, 9.0, 2.0, 16.0, 13.0, 17.0, 23.0, 21.0, 27.0, 43.0, 38.0, 65.0, 81.0, 101.0, 97.0, 91.0, 61.0, 43.0, 51.0, 32.0, 28.0, 13.0, 24.0, 31.0, 13.0, 8.0, 7.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.386474609375, -0.37456512451171875, -0.3626556396484375, -0.35074615478515625, -0.338836669921875, -0.32692718505859375, -0.3150177001953125, -0.30310821533203125, -0.29119873046875, -0.27928924560546875, -0.2673797607421875, -0.25547027587890625, -0.243560791015625, -0.23165130615234375, -0.2197418212890625, -0.20783233642578125, -0.1959228515625, -0.18401336669921875, -0.1721038818359375, -0.16019439697265625, -0.148284912109375, -0.13637542724609375, -0.1244659423828125, -0.11255645751953125, -0.10064697265625, -0.08873748779296875, -0.0768280029296875, -0.06491851806640625, -0.053009033203125, -0.04109954833984375, -0.0291900634765625, -0.01728057861328125, -0.00537109375, 0.00653839111328125, 0.0184478759765625, 0.03035736083984375, 0.042266845703125, 0.05417633056640625, 0.0660858154296875, 0.07799530029296875, 0.08990478515625, 0.10181427001953125, 0.1137237548828125, 0.12563323974609375, 0.137542724609375, 0.14945220947265625, 0.1613616943359375, 0.17327117919921875, 0.1851806640625, 0.19709014892578125, 0.2089996337890625, 0.22090911865234375, 0.232818603515625, 0.24472808837890625, 0.2566375732421875, 0.26854705810546875, 0.28045654296875, 0.29236602783203125, 0.3042755126953125, 0.31618499755859375, 0.328094482421875, 0.34000396728515625, 0.3519134521484375, 0.36382293701171875, 0.375732421875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 11.0, 56.0, 179.0, 391.0, 271.0, 77.0, 18.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.14911651611328, -37.380836486816406, -36.6125602722168, -35.84428024291992, -35.07600402832031, -34.30772399902344, -33.53944396972656, -32.77116775512695, -32.00288772583008, -31.234609603881836, -30.466331481933594, -29.69805145263672, -28.929773330688477, -28.161495208740234, -27.39321517944336, -26.624937057495117, -25.856658935546875, -25.088380813598633, -24.32010269165039, -23.551822662353516, -22.783544540405273, -22.01526641845703, -21.246986389160156, -20.478708267211914, -19.710430145263672, -18.94215202331543, -18.173873901367188, -17.405593872070312, -16.63731575012207, -15.869037628173828, -15.10075855255127, -14.332479476928711, -13.564202308654785, -12.795923233032227, -12.027645111083984, -11.259366989135742, -10.491087913513184, -9.722808837890625, -8.954530715942383, -8.18625259399414, -7.417973518371582, -6.649694919586182, -5.881416320800781, -5.113137722015381, -4.3448591232299805, -3.57658052444458, -2.8083019256591797, -2.0400233268737793, -1.271744728088379, -0.5034661293029785, 0.2648124694824219, 1.0330910682678223, 1.8013696670532227, 2.569648265838623, 3.3379268646240234, 4.106205463409424, 4.874484062194824, 5.642762660980225, 6.411041259765625, 7.179319858551025, 7.947598457336426, 8.715877532958984, 9.484155654907227, 10.252433776855469, 11.020712852478027]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 3.0, 7.0, 7.0, 13.0, 12.0, 10.0, 10.0, 18.0, 21.0, 13.0, 22.0, 23.0, 32.0, 26.0, 19.0, 31.0, 43.0, 38.0, 47.0, 40.0, 37.0, 34.0, 36.0, 41.0, 32.0, 41.0, 37.0, 27.0, 32.0, 34.0, 29.0, 28.0, 16.0, 25.0, 20.0, 15.0, 12.0, 14.0, 6.0, 13.0, 7.0, 6.0, 5.0, 7.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.737830638885498, -5.536037445068359, -5.334244251251221, -5.132451057434082, -4.930657863616943, -4.728864669799805, -4.527071475982666, -4.325278282165527, -4.123485088348389, -3.92169189453125, -3.7198987007141113, -3.5181055068969727, -3.316312313079834, -3.1145191192626953, -2.9127259254455566, -2.710932731628418, -2.5091395378112793, -2.3073463439941406, -2.105553150177002, -1.9037599563598633, -1.7019667625427246, -1.500173568725586, -1.2983803749084473, -1.0965871810913086, -0.8947939872741699, -0.6930007934570312, -0.4912075996398926, -0.2894144058227539, -0.08762121200561523, 0.11417198181152344, 0.3159651756286621, 0.5177583694458008, 0.7195510864257812, 0.9213442802429199, 1.1231374740600586, 1.3249306678771973, 1.526723861694336, 1.7285170555114746, 1.9303102493286133, 2.132103443145752, 2.3338966369628906, 2.5356898307800293, 2.737483024597168, 2.9392762184143066, 3.1410694122314453, 3.342862606048584, 3.5446557998657227, 3.7464489936828613, 3.9482421875, 4.150035381317139, 4.351828575134277, 4.553621768951416, 4.755414962768555, 4.957208156585693, 5.159001350402832, 5.360794544219971, 5.562587738037109, 5.764380931854248, 5.966174125671387, 6.167967319488525, 6.369760513305664, 6.571553707122803, 6.773346900939941, 6.97514009475708, 7.176933288574219]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 12.0, 14.0, 36.0, 72.0, 159.0, 382.0, 1008.0, 2868.0, 11131.0, 70393.0, 1254221.0, 2656404.0, 172452.0, 18496.0, 4277.0, 1389.0, 532.0, 212.0, 93.0, 50.0, 23.0, 13.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41796875, -5.2384033203125, -5.058837890625, -4.8792724609375, -4.69970703125, -4.5201416015625, -4.340576171875, -4.1610107421875, -3.9814453125, -3.8018798828125, -3.622314453125, -3.4427490234375, -3.26318359375, -3.0836181640625, -2.904052734375, -2.7244873046875, -2.544921875, -2.3653564453125, -2.185791015625, -2.0062255859375, -1.82666015625, -1.6470947265625, -1.467529296875, -1.2879638671875, -1.1083984375, -0.9288330078125, -0.749267578125, -0.5697021484375, -0.39013671875, -0.2105712890625, -0.031005859375, 0.1485595703125, 0.328125, 0.5076904296875, 0.687255859375, 0.8668212890625, 1.04638671875, 1.2259521484375, 1.405517578125, 1.5850830078125, 1.7646484375, 1.9442138671875, 2.123779296875, 2.3033447265625, 2.48291015625, 2.6624755859375, 2.842041015625, 3.0216064453125, 3.201171875, 3.3807373046875, 3.560302734375, 3.7398681640625, 3.91943359375, 4.0989990234375, 4.278564453125, 4.4581298828125, 4.6376953125, 4.8172607421875, 4.996826171875, 5.1763916015625, 5.35595703125, 5.5355224609375, 5.715087890625, 5.8946533203125, 6.07421875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 9.0, 4.0, 10.0, 21.0, 18.0, 16.0, 27.0, 28.0, 30.0, 37.0, 38.0, 50.0, 41.0, 52.0, 53.0, 62.0, 50.0, 73.0, 56.0, 48.0, 49.0, 33.0, 39.0, 31.0, 21.0, 16.0, 19.0, 14.0, 11.0, 10.0, 8.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.025390625, -2.929840087890625, -2.83428955078125, -2.738739013671875, -2.6431884765625, -2.547637939453125, -2.45208740234375, -2.356536865234375, -2.260986328125, -2.165435791015625, -2.06988525390625, -1.974334716796875, -1.8787841796875, -1.783233642578125, -1.68768310546875, -1.592132568359375, -1.49658203125, -1.401031494140625, -1.30548095703125, -1.209930419921875, -1.1143798828125, -1.018829345703125, -0.92327880859375, -0.827728271484375, -0.732177734375, -0.636627197265625, -0.54107666015625, -0.445526123046875, -0.3499755859375, -0.254425048828125, -0.15887451171875, -0.063323974609375, 0.0322265625, 0.127777099609375, 0.22332763671875, 0.318878173828125, 0.4144287109375, 0.509979248046875, 0.60552978515625, 0.701080322265625, 0.796630859375, 0.892181396484375, 0.98773193359375, 1.083282470703125, 1.1788330078125, 1.274383544921875, 1.36993408203125, 1.465484619140625, 1.56103515625, 1.656585693359375, 1.75213623046875, 1.847686767578125, 1.9432373046875, 2.038787841796875, 2.13433837890625, 2.229888916015625, 2.325439453125, 2.420989990234375, 2.51654052734375, 2.612091064453125, 2.7076416015625, 2.803192138671875, 2.89874267578125, 2.994293212890625, 3.08984375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 1.0, 2.0, 7.0, 12.0, 10.0, 12.0, 12.0, 32.0, 39.0, 55.0, 82.0, 124.0, 225.0, 377.0, 704.0, 1601.0, 4532.0, 16883.0, 106184.0, 2784890.0, 1196700.0, 63944.0, 11753.0, 3387.0, 1260.0, 587.0, 324.0, 175.0, 93.0, 72.0, 59.0, 30.0, 31.0, 22.0, 11.0, 10.0, 7.0, 9.0, 3.0, 5.0, 1.0, 1.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.9609375, -4.81005859375, -4.6591796875, -4.50830078125, -4.357421875, -4.20654296875, -4.0556640625, -3.90478515625, -3.75390625, -3.60302734375, -3.4521484375, -3.30126953125, -3.150390625, -2.99951171875, -2.8486328125, -2.69775390625, -2.546875, -2.39599609375, -2.2451171875, -2.09423828125, -1.943359375, -1.79248046875, -1.6416015625, -1.49072265625, -1.33984375, -1.18896484375, -1.0380859375, -0.88720703125, -0.736328125, -0.58544921875, -0.4345703125, -0.28369140625, -0.1328125, 0.01806640625, 0.1689453125, 0.31982421875, 0.470703125, 0.62158203125, 0.7724609375, 0.92333984375, 1.07421875, 1.22509765625, 1.3759765625, 1.52685546875, 1.677734375, 1.82861328125, 1.9794921875, 2.13037109375, 2.28125, 2.43212890625, 2.5830078125, 2.73388671875, 2.884765625, 3.03564453125, 3.1865234375, 3.33740234375, 3.48828125, 3.63916015625, 3.7900390625, 3.94091796875, 4.091796875, 4.24267578125, 4.3935546875, 4.54443359375, 4.6953125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 12.0, 14.0, 18.0, 32.0, 35.0, 62.0, 91.0, 145.0, 255.0, 417.0, 700.0, 755.0, 606.0, 342.0, 223.0, 112.0, 74.0, 55.0, 39.0, 17.0, 22.0, 11.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2314453125, -1.184539794921875, -1.13763427734375, -1.090728759765625, -1.0438232421875, -0.996917724609375, -0.95001220703125, -0.903106689453125, -0.856201171875, -0.809295654296875, -0.76239013671875, -0.715484619140625, -0.6685791015625, -0.621673583984375, -0.57476806640625, -0.527862548828125, -0.48095703125, -0.434051513671875, -0.38714599609375, -0.340240478515625, -0.2933349609375, -0.246429443359375, -0.19952392578125, -0.152618408203125, -0.105712890625, -0.058807373046875, -0.01190185546875, 0.035003662109375, 0.0819091796875, 0.128814697265625, 0.17572021484375, 0.222625732421875, 0.26953125, 0.316436767578125, 0.36334228515625, 0.410247802734375, 0.4571533203125, 0.504058837890625, 0.55096435546875, 0.597869873046875, 0.644775390625, 0.691680908203125, 0.73858642578125, 0.785491943359375, 0.8323974609375, 0.879302978515625, 0.92620849609375, 0.973114013671875, 1.02001953125, 1.066925048828125, 1.11383056640625, 1.160736083984375, 1.2076416015625, 1.254547119140625, 1.30145263671875, 1.348358154296875, 1.395263671875, 1.442169189453125, 1.48907470703125, 1.535980224609375, 1.5828857421875, 1.629791259765625, 1.67669677734375, 1.723602294921875, 1.7705078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 8.0, 17.0, 23.0, 33.0, 50.0, 81.0, 70.0, 106.0, 114.0, 96.0, 110.0, 68.0, 65.0, 46.0, 39.0, 17.0, 18.0, 13.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.17844820022583, -7.004284858703613, -6.8301215171813965, -6.655958652496338, -6.481795310974121, -6.307631969451904, -6.1334686279296875, -5.959305763244629, -5.785142421722412, -5.610979080200195, -5.4368157386779785, -5.26265287399292, -5.088489532470703, -4.914326190948486, -4.7401628494262695, -4.565999984741211, -4.391836166381836, -4.217672824859619, -4.043509483337402, -3.8693463802337646, -3.695183277130127, -3.52101993560791, -3.3468565940856934, -3.1726934909820557, -2.998530387878418, -2.824367046356201, -2.6502039432525635, -2.4760406017303467, -2.301877498626709, -2.127714157104492, -1.953550934791565, -1.7793877124786377, -1.605224609375, -1.4310613870620728, -1.2568981647491455, -1.0827348232269287, -0.9085716605186462, -0.734408438205719, -0.560245156288147, -0.3860819339752197, -0.21191871166229248, -0.03775547444820404, 0.1364077627658844, 0.31057101488113403, 0.4847342371940613, 0.6588974595069885, 0.8330607414245605, 1.0072239637374878, 1.181387186050415, 1.3555504083633423, 1.5297136306762695, 1.7038769721984863, 1.878040075302124, 2.052203416824341, 2.2263665199279785, 2.4005298614501953, 2.574693202972412, 2.748856544494629, 2.9230196475982666, 3.0971829891204834, 3.271346092224121, 3.445509433746338, 3.6196727752685547, 3.7938358783721924, 3.96799898147583]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 3.0, 9.0, 9.0, 9.0, 9.0, 18.0, 13.0, 24.0, 20.0, 16.0, 27.0, 38.0, 25.0, 37.0, 46.0, 35.0, 43.0, 43.0, 48.0, 52.0, 56.0, 35.0, 42.0, 34.0, 37.0, 41.0, 30.0, 34.0, 24.0, 17.0, 26.0, 20.0, 12.0, 9.0, 14.0, 7.0, 10.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.608947277069092, -2.521838426589966, -2.43472957611084, -2.347620964050293, -2.260512113571167, -2.173403263092041, -2.086294651031494, -1.9991858005523682, -1.9120769500732422, -1.8249680995941162, -1.7378593683242798, -1.6507506370544434, -1.5636417865753174, -1.4765329360961914, -1.389424204826355, -1.3023154735565186, -1.2152066230773926, -1.1280977725982666, -1.0409890413284302, -0.953880250453949, -0.8667714595794678, -0.7796626687049866, -0.6925538778305054, -0.6054450869560242, -0.518336296081543, -0.43122750520706177, -0.34411871433258057, -0.25700992345809937, -0.16990113258361816, -0.08279234170913696, 0.004316449165344238, 0.09142524003982544, 0.17853403091430664, 0.26564282178878784, 0.35275161266326904, 0.43986040353775024, 0.5269691944122314, 0.6140779852867126, 0.7011867761611938, 0.788295567035675, 0.8754043579101562, 0.9625131487846375, 1.0496219396591187, 1.136730670928955, 1.223839521408081, 1.310948371887207, 1.3980571031570435, 1.4851658344268799, 1.5722746849060059, 1.6593835353851318, 1.7464922666549683, 1.8336009979248047, 1.9207098484039307, 2.0078186988830566, 2.0949273109436035, 2.1820361614227295, 2.2691450119018555, 2.3562538623809814, 2.4433627128601074, 2.5304713249206543, 2.6175801753997803, 2.7046890258789062, 2.791797637939453, 2.878906488418579, 2.966015338897705]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 15.0, 20.0, 26.0, 36.0, 65.0, 73.0, 106.0, 179.0, 266.0, 481.0, 787.0, 1476.0, 2667.0, 5639.0, 12049.0, 28421.0, 77796.0, 260697.0, 432261.0, 142762.0, 47314.0, 18484.0, 8166.0, 3934.0, 2012.0, 1128.0, 613.0, 383.0, 215.0, 163.0, 92.0, 67.0, 46.0, 27.0, 16.0, 18.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3896484375, -0.3779335021972656, -0.36621856689453125, -0.3545036315917969, -0.3427886962890625, -0.3310737609863281, -0.31935882568359375, -0.3076438903808594, -0.295928955078125, -0.2842140197753906, -0.27249908447265625, -0.2607841491699219, -0.2490692138671875, -0.23735427856445312, -0.22563934326171875, -0.21392440795898438, -0.20220947265625, -0.19049453735351562, -0.17877960205078125, -0.16706466674804688, -0.1553497314453125, -0.14363479614257812, -0.13191986083984375, -0.12020492553710938, -0.108489990234375, -0.09677505493164062, -0.08506011962890625, -0.07334518432617188, -0.0616302490234375, -0.049915313720703125, -0.03820037841796875, -0.026485443115234375, -0.0147705078125, -0.003055572509765625, 0.00865936279296875, 0.020374298095703125, 0.0320892333984375, 0.043804168701171875, 0.05551910400390625, 0.06723403930664062, 0.078948974609375, 0.09066390991210938, 0.10237884521484375, 0.11409378051757812, 0.1258087158203125, 0.13752365112304688, 0.14923858642578125, 0.16095352172851562, 0.17266845703125, 0.18438339233398438, 0.19609832763671875, 0.20781326293945312, 0.2195281982421875, 0.23124313354492188, 0.24295806884765625, 0.2546730041503906, 0.266387939453125, 0.2781028747558594, 0.28981781005859375, 0.3015327453613281, 0.3132476806640625, 0.3249626159667969, 0.33667755126953125, 0.3483924865722656, 0.360107421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 8.0, 6.0, 8.0, 10.0, 6.0, 7.0, 12.0, 25.0, 22.0, 25.0, 29.0, 46.0, 44.0, 37.0, 59.0, 54.0, 52.0, 59.0, 53.0, 59.0, 49.0, 38.0, 52.0, 44.0, 32.0, 32.0, 27.0, 24.0, 21.0, 16.0, 5.0, 14.0, 5.0, 15.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.892578125, -1.8271484375, -1.76171875, -1.6962890625, -1.630859375, -1.5654296875, -1.5, -1.4345703125, -1.369140625, -1.3037109375, -1.23828125, -1.1728515625, -1.107421875, -1.0419921875, -0.9765625, -0.9111328125, -0.845703125, -0.7802734375, -0.71484375, -0.6494140625, -0.583984375, -0.5185546875, -0.453125, -0.3876953125, -0.322265625, -0.2568359375, -0.19140625, -0.1259765625, -0.060546875, 0.0048828125, 0.0703125, 0.1357421875, 0.201171875, 0.2666015625, 0.33203125, 0.3974609375, 0.462890625, 0.5283203125, 0.59375, 0.6591796875, 0.724609375, 0.7900390625, 0.85546875, 0.9208984375, 0.986328125, 1.0517578125, 1.1171875, 1.1826171875, 1.248046875, 1.3134765625, 1.37890625, 1.4443359375, 1.509765625, 1.5751953125, 1.640625, 1.7060546875, 1.771484375, 1.8369140625, 1.90234375, 1.9677734375, 2.033203125, 2.0986328125, 2.1640625, 2.2294921875, 2.294921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 13.0, 16.0, 10.0, 33.0, 50.0, 58.0, 80.0, 125.0, 205.0, 288.0, 425.0, 727.0, 1161.0, 1914.0, 3177.0, 5585.0, 10424.0, 19951.0, 42359.0, 98319.0, 260895.0, 347696.0, 141050.0, 57486.0, 26293.0, 13086.0, 6991.0, 3994.0, 2300.0, 1393.0, 856.0, 512.0, 361.0, 225.0, 182.0, 99.0, 74.0, 33.0, 28.0, 22.0, 17.0, 11.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20947265625, -0.20229530334472656, -0.19511795043945312, -0.1879405975341797, -0.18076324462890625, -0.1735858917236328, -0.16640853881835938, -0.15923118591308594, -0.1520538330078125, -0.14487648010253906, -0.13769912719726562, -0.1305217742919922, -0.12334442138671875, -0.11616706848144531, -0.10898971557617188, -0.10181236267089844, -0.094635009765625, -0.08745765686035156, -0.08028030395507812, -0.07310295104980469, -0.06592559814453125, -0.05874824523925781, -0.051570892333984375, -0.04439353942871094, -0.0372161865234375, -0.030038833618164062, -0.022861480712890625, -0.015684127807617188, -0.00850677490234375, -0.0013294219970703125, 0.005847930908203125, 0.013025283813476562, 0.02020263671875, 0.027379989624023438, 0.034557342529296875, 0.04173469543457031, 0.04891204833984375, 0.05608940124511719, 0.06326675415039062, 0.07044410705566406, 0.0776214599609375, 0.08479881286621094, 0.09197616577148438, 0.09915351867675781, 0.10633087158203125, 0.11350822448730469, 0.12068557739257812, 0.12786293029785156, 0.135040283203125, 0.14221763610839844, 0.14939498901367188, 0.1565723419189453, 0.16374969482421875, 0.1709270477294922, 0.17810440063476562, 0.18528175354003906, 0.1924591064453125, 0.19963645935058594, 0.20681381225585938, 0.2139911651611328, 0.22116851806640625, 0.2283458709716797, 0.23552322387695312, 0.24270057678222656, 0.2498779296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 4.0, 5.0, 7.0, 12.0, 15.0, 14.0, 20.0, 23.0, 27.0, 32.0, 32.0, 34.0, 45.0, 37.0, 49.0, 62.0, 55.0, 57.0, 46.0, 54.0, 42.0, 46.0, 43.0, 29.0, 31.0, 29.0, 23.0, 18.0, 16.0, 18.0, 15.0, 5.0, 13.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.650390625, -3.530548095703125, -3.41070556640625, -3.290863037109375, -3.1710205078125, -3.051177978515625, -2.93133544921875, -2.811492919921875, -2.691650390625, -2.571807861328125, -2.45196533203125, -2.332122802734375, -2.2122802734375, -2.092437744140625, -1.97259521484375, -1.852752685546875, -1.73291015625, -1.613067626953125, -1.49322509765625, -1.373382568359375, -1.2535400390625, -1.133697509765625, -1.01385498046875, -0.894012451171875, -0.774169921875, -0.654327392578125, -0.53448486328125, -0.414642333984375, -0.2947998046875, -0.174957275390625, -0.05511474609375, 0.064727783203125, 0.1845703125, 0.304412841796875, 0.42425537109375, 0.544097900390625, 0.6639404296875, 0.783782958984375, 0.90362548828125, 1.023468017578125, 1.143310546875, 1.263153076171875, 1.38299560546875, 1.502838134765625, 1.6226806640625, 1.742523193359375, 1.86236572265625, 1.982208251953125, 2.10205078125, 2.221893310546875, 2.34173583984375, 2.461578369140625, 2.5814208984375, 2.701263427734375, 2.82110595703125, 2.940948486328125, 3.060791015625, 3.180633544921875, 3.30047607421875, 3.420318603515625, 3.5401611328125, 3.660003662109375, 3.77984619140625, 3.899688720703125, 4.01953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 8.0, 14.0, 6.0, 21.0, 30.0, 44.0, 59.0, 88.0, 147.0, 241.0, 555.0, 1476.0, 5406.0, 40945.0, 863995.0, 121194.0, 10620.0, 2267.0, 770.0, 305.0, 157.0, 67.0, 60.0, 33.0, 16.0, 6.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0914306640625, -0.0887155532836914, -0.08600044250488281, -0.08328533172607422, -0.08057022094726562, -0.07785511016845703, -0.07513999938964844, -0.07242488861083984, -0.06970977783203125, -0.06699466705322266, -0.06427955627441406, -0.06156444549560547, -0.058849334716796875, -0.05613422393798828, -0.05341911315917969, -0.050704002380371094, -0.0479888916015625, -0.045273780822753906, -0.04255867004394531, -0.03984355926513672, -0.037128448486328125, -0.03441333770751953, -0.03169822692871094, -0.028983116149902344, -0.02626800537109375, -0.023552894592285156, -0.020837783813476562, -0.01812267303466797, -0.015407562255859375, -0.012692451477050781, -0.009977340698242188, -0.007262229919433594, -0.004547119140625, -0.0018320083618164062, 0.0008831024169921875, 0.0035982131958007812, 0.006313323974609375, 0.009028434753417969, 0.011743545532226562, 0.014458656311035156, 0.01717376708984375, 0.019888877868652344, 0.022603988647460938, 0.02531909942626953, 0.028034210205078125, 0.03074932098388672, 0.03346443176269531, 0.036179542541503906, 0.0388946533203125, 0.041609764099121094, 0.04432487487792969, 0.04703998565673828, 0.049755096435546875, 0.05247020721435547, 0.05518531799316406, 0.057900428771972656, 0.06061553955078125, 0.06333065032958984, 0.06604576110839844, 0.06876087188720703, 0.07147598266601562, 0.07419109344482422, 0.07690620422363281, 0.0796213150024414, 0.08233642578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 9.0, 7.0, 13.0, 16.0, 25.0, 37.0, 57.0, 78.0, 129.0, 141.0, 143.0, 117.0, 65.0, 51.0, 33.0, 18.0, 24.0, 12.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8279762268066406e-05, -4.6897679567337036e-05, -4.5515596866607666e-05, -4.4133514165878296e-05, -4.2751431465148926e-05, -4.1369348764419556e-05, -3.9987266063690186e-05, -3.8605183362960815e-05, -3.7223100662231445e-05, -3.5841017961502075e-05, -3.4458935260772705e-05, -3.3076852560043335e-05, -3.1694769859313965e-05, -3.0312687158584595e-05, -2.8930604457855225e-05, -2.7548521757125854e-05, -2.6166439056396484e-05, -2.4784356355667114e-05, -2.3402273654937744e-05, -2.2020190954208374e-05, -2.0638108253479004e-05, -1.9256025552749634e-05, -1.7873942852020264e-05, -1.6491860151290894e-05, -1.5109777450561523e-05, -1.3727694749832153e-05, -1.2345612049102783e-05, -1.0963529348373413e-05, -9.581446647644043e-06, -8.199363946914673e-06, -6.817281246185303e-06, -5.435198545455933e-06, -4.0531158447265625e-06, -2.6710331439971924e-06, -1.2889504432678223e-06, 9.313225746154785e-08, 1.475214958190918e-06, 2.857297658920288e-06, 4.239380359649658e-06, 5.621463060379028e-06, 7.0035457611083984e-06, 8.385628461837769e-06, 9.767711162567139e-06, 1.1149793863296509e-05, 1.2531876564025879e-05, 1.3913959264755249e-05, 1.529604196548462e-05, 1.667812466621399e-05, 1.806020736694336e-05, 1.944229006767273e-05, 2.08243727684021e-05, 2.220645546913147e-05, 2.358853816986084e-05, 2.497062087059021e-05, 2.635270357131958e-05, 2.773478627204895e-05, 2.911686897277832e-05, 3.049895167350769e-05, 3.188103437423706e-05, 3.326311707496643e-05, 3.46451997756958e-05, 3.602728247642517e-05, 3.740936517715454e-05, 3.879144787788391e-05, 4.017353057861328e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 7.0, 12.0, 17.0, 23.0, 40.0, 80.0, 133.0, 284.0, 581.0, 1561.0, 5184.0, 26217.0, 429064.0, 546826.0, 30133.0, 5572.0, 1620.0, 629.0, 257.0, 128.0, 67.0, 43.0, 29.0, 14.0, 12.0, 5.0, 9.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.10931396484375, -0.10643959045410156, -0.10356521606445312, -0.10069084167480469, -0.09781646728515625, -0.09494209289550781, -0.09206771850585938, -0.08919334411621094, -0.0863189697265625, -0.08344459533691406, -0.08057022094726562, -0.07769584655761719, -0.07482147216796875, -0.07194709777832031, -0.06907272338867188, -0.06619834899902344, -0.063323974609375, -0.06044960021972656, -0.057575225830078125, -0.05470085144042969, -0.05182647705078125, -0.04895210266113281, -0.046077728271484375, -0.04320335388183594, -0.0403289794921875, -0.03745460510253906, -0.034580230712890625, -0.03170585632324219, -0.02883148193359375, -0.025957107543945312, -0.023082733154296875, -0.020208358764648438, -0.017333984375, -0.014459609985351562, -0.011585235595703125, -0.008710861206054688, -0.00583648681640625, -0.0029621124267578125, -8.7738037109375e-05, 0.0027866363525390625, 0.0056610107421875, 0.008535385131835938, 0.011409759521484375, 0.014284133911132812, 0.01715850830078125, 0.020032882690429688, 0.022907257080078125, 0.025781631469726562, 0.028656005859375, 0.03153038024902344, 0.034404754638671875, 0.03727912902832031, 0.04015350341796875, 0.04302787780761719, 0.045902252197265625, 0.04877662658691406, 0.0516510009765625, 0.05452537536621094, 0.057399749755859375, 0.06027412414550781, 0.06314849853515625, 0.06602287292480469, 0.06889724731445312, 0.07177162170410156, 0.07464599609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 8.0, 5.0, 14.0, 31.0, 62.0, 132.0, 294.0, 258.0, 92.0, 44.0, 23.0, 15.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03302001953125, -0.032169342041015625, -0.03131866455078125, -0.030467987060546875, -0.0296173095703125, -0.028766632080078125, -0.02791595458984375, -0.027065277099609375, -0.026214599609375, -0.025363922119140625, -0.02451324462890625, -0.023662567138671875, -0.0228118896484375, -0.021961212158203125, -0.02111053466796875, -0.020259857177734375, -0.0194091796875, -0.018558502197265625, -0.01770782470703125, -0.016857147216796875, -0.0160064697265625, -0.015155792236328125, -0.01430511474609375, -0.013454437255859375, -0.012603759765625, -0.011753082275390625, -0.01090240478515625, -0.010051727294921875, -0.0092010498046875, -0.008350372314453125, -0.00749969482421875, -0.006649017333984375, -0.00579833984375, -0.004947662353515625, -0.00409698486328125, -0.003246307373046875, -0.0023956298828125, -0.001544952392578125, -0.00069427490234375, 0.000156402587890625, 0.001007080078125, 0.001857757568359375, 0.00270843505859375, 0.003559112548828125, 0.0044097900390625, 0.005260467529296875, 0.00611114501953125, 0.006961822509765625, 0.0078125, 0.008663177490234375, 0.00951385498046875, 0.010364532470703125, 0.0112152099609375, 0.012065887451171875, 0.01291656494140625, 0.013767242431640625, 0.014617919921875, 0.015468597412109375, 0.01631927490234375, 0.017169952392578125, 0.0180206298828125, 0.018871307373046875, 0.01972198486328125, 0.020572662353515625, 0.02142333984375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 17.0, 46.0, 122.0, 205.0, 247.0, 187.0, 101.0, 41.0, 20.0, 9.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.502792358398438, -10.27670669555664, -10.050621032714844, -9.824535369873047, -9.59844970703125, -9.372364044189453, -9.146278381347656, -8.92019271850586, -8.694107055664062, -8.468021392822266, -8.241935729980469, -8.015850067138672, -7.789764404296875, -7.563678741455078, -7.337592601776123, -7.111506938934326, -6.885420799255371, -6.659335136413574, -6.433249473571777, -6.2071638107299805, -5.981078147888184, -5.754992485046387, -5.528906345367432, -5.302820682525635, -5.076735019683838, -4.850649356842041, -4.624563694000244, -4.398478031158447, -4.172391891479492, -3.9463064670562744, -3.7202205657958984, -3.4941349029541016, -3.2680487632751465, -3.0419631004333496, -2.8158774375915527, -2.5897915363311768, -2.36370587348938, -2.137620210647583, -1.9115344285964966, -1.6854486465454102, -1.4593629837036133, -1.2332773208618164, -1.00719153881073, -0.7811058163642883, -0.5550200939178467, -0.3289344310760498, -0.10284864902496338, 0.12323713302612305, 0.3493227958679199, 0.5754085183143616, 0.8014942407608032, 1.0275800228118896, 1.2536656856536865, 1.4797513484954834, 1.7058371305465698, 1.9319229125976562, 2.158008575439453, 2.38409423828125, 2.610179901123047, 2.836265802383423, 3.0623514652252197, 3.2884371280670166, 3.5145230293273926, 3.7406086921691895, 3.9666943550109863]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 4.0, 4.0, 10.0, 6.0, 18.0, 13.0, 15.0, 28.0, 16.0, 24.0, 25.0, 40.0, 36.0, 47.0, 43.0, 47.0, 45.0, 55.0, 56.0, 52.0, 45.0, 43.0, 40.0, 49.0, 29.0, 31.0, 32.0, 25.0, 24.0, 18.0, 10.0, 14.0, 11.0, 10.0, 5.0, 5.0, 4.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7506234645843506, -1.6942590475082397, -1.6378945112228394, -1.5815300941467285, -1.5251655578613281, -1.4688011407852173, -1.4124367237091064, -1.356072187423706, -1.2997076511383057, -1.2433432340621948, -1.1869786977767944, -1.1306142807006836, -1.0742497444152832, -1.0178853273391724, -0.9615208506584167, -0.9051563739776611, -0.8487919569015503, -0.7924274802207947, -0.7360630035400391, -0.6796985864639282, -0.6233340501785278, -0.566969633102417, -0.5106051564216614, -0.45424067974090576, -0.39787620306015015, -0.34151172637939453, -0.2851472496986389, -0.2287828028202057, -0.17241832613945007, -0.11605384945869446, -0.05968940258026123, -0.0033249258995056152, 0.05303955078125, 0.10940402001142502, 0.16576848924160004, 0.22213295102119446, 0.2784974277019501, 0.3348619043827057, 0.3912263512611389, 0.44759082794189453, 0.5039553046226501, 0.5603197813034058, 0.6166842579841614, 0.673048734664917, 0.7294131517410278, 0.7857776880264282, 0.8421421051025391, 0.8985065817832947, 0.9548710584640503, 1.0112354755401611, 1.0676000118255615, 1.1239644289016724, 1.1803289651870728, 1.2366933822631836, 1.293057918548584, 1.3494223356246948, 1.4057867527008057, 1.4621511697769165, 1.518515706062317, 1.5748801231384277, 1.6312446594238281, 1.687609076499939, 1.7439734935760498, 1.8003380298614502, 1.8567025661468506]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 5.0, 6.0, 26.0, 33.0, 44.0, 73.0, 115.0, 178.0, 303.0, 485.0, 870.0, 1567.0, 3192.0, 6556.0, 14953.0, 38076.0, 148837.0, 648629.0, 123952.0, 34320.0, 13725.0, 6221.0, 2932.0, 1432.0, 793.0, 477.0, 268.0, 165.0, 94.0, 71.0, 46.0, 41.0, 24.0, 10.0, 14.0, 5.0, 1.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.08203125, -2.0233001708984375, -1.964569091796875, -1.9058380126953125, -1.84710693359375, -1.7883758544921875, -1.729644775390625, -1.6709136962890625, -1.6121826171875, -1.5534515380859375, -1.494720458984375, -1.4359893798828125, -1.37725830078125, -1.3185272216796875, -1.259796142578125, -1.2010650634765625, -1.142333984375, -1.0836029052734375, -1.024871826171875, -0.9661407470703125, -0.90740966796875, -0.8486785888671875, -0.789947509765625, -0.7312164306640625, -0.6724853515625, -0.6137542724609375, -0.555023193359375, -0.4962921142578125, -0.43756103515625, -0.3788299560546875, -0.320098876953125, -0.2613677978515625, -0.20263671875, -0.1439056396484375, -0.085174560546875, -0.0264434814453125, 0.03228759765625, 0.0910186767578125, 0.149749755859375, 0.2084808349609375, 0.2672119140625, 0.3259429931640625, 0.384674072265625, 0.4434051513671875, 0.50213623046875, 0.5608673095703125, 0.619598388671875, 0.6783294677734375, 0.737060546875, 0.7957916259765625, 0.854522705078125, 0.9132537841796875, 0.97198486328125, 1.0307159423828125, 1.089447021484375, 1.1481781005859375, 1.2069091796875, 1.2656402587890625, 1.324371337890625, 1.3831024169921875, 1.44183349609375, 1.5005645751953125, 1.559295654296875, 1.6180267333984375, 1.6767578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 9.0, 4.0, 11.0, 12.0, 14.0, 13.0, 23.0, 30.0, 30.0, 31.0, 32.0, 41.0, 50.0, 40.0, 55.0, 52.0, 59.0, 59.0, 54.0, 51.0, 44.0, 46.0, 42.0, 41.0, 27.0, 17.0, 20.0, 19.0, 12.0, 6.0, 6.0, 13.0, 9.0, 9.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.933258056640625, -3.80792236328125, -3.682586669921875, -3.5572509765625, -3.431915283203125, -3.30657958984375, -3.181243896484375, -3.055908203125, -2.930572509765625, -2.80523681640625, -2.679901123046875, -2.5545654296875, -2.429229736328125, -2.30389404296875, -2.178558349609375, -2.05322265625, -1.927886962890625, -1.80255126953125, -1.677215576171875, -1.5518798828125, -1.426544189453125, -1.30120849609375, -1.175872802734375, -1.050537109375, -0.925201416015625, -0.79986572265625, -0.674530029296875, -0.5491943359375, -0.423858642578125, -0.29852294921875, -0.173187255859375, -0.0478515625, 0.077484130859375, 0.20281982421875, 0.328155517578125, 0.4534912109375, 0.578826904296875, 0.70416259765625, 0.829498291015625, 0.954833984375, 1.080169677734375, 1.20550537109375, 1.330841064453125, 1.4561767578125, 1.581512451171875, 1.70684814453125, 1.832183837890625, 1.95751953125, 2.082855224609375, 2.20819091796875, 2.333526611328125, 2.4588623046875, 2.584197998046875, 2.70953369140625, 2.834869384765625, 2.960205078125, 3.085540771484375, 3.21087646484375, 3.336212158203125, 3.4615478515625, 3.586883544921875, 3.71221923828125, 3.837554931640625, 3.962890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 6.0, 14.0, 20.0, 11.0, 24.0, 36.0, 52.0, 56.0, 89.0, 122.0, 191.0, 282.0, 547.0, 1316.0, 3793.0, 14688.0, 95901.0, 828529.0, 83213.0, 13514.0, 3559.0, 1167.0, 547.0, 267.0, 149.0, 122.0, 80.0, 69.0, 46.0, 32.0, 27.0, 14.0, 20.0, 13.0, 11.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.705078125, -3.603485107421875, -3.50189208984375, -3.400299072265625, -3.2987060546875, -3.197113037109375, -3.09552001953125, -2.993927001953125, -2.892333984375, -2.790740966796875, -2.68914794921875, -2.587554931640625, -2.4859619140625, -2.384368896484375, -2.28277587890625, -2.181182861328125, -2.07958984375, -1.977996826171875, -1.87640380859375, -1.774810791015625, -1.6732177734375, -1.571624755859375, -1.47003173828125, -1.368438720703125, -1.266845703125, -1.165252685546875, -1.06365966796875, -0.962066650390625, -0.8604736328125, -0.758880615234375, -0.65728759765625, -0.555694580078125, -0.4541015625, -0.352508544921875, -0.25091552734375, -0.149322509765625, -0.0477294921875, 0.053863525390625, 0.15545654296875, 0.257049560546875, 0.358642578125, 0.460235595703125, 0.56182861328125, 0.663421630859375, 0.7650146484375, 0.866607666015625, 0.96820068359375, 1.069793701171875, 1.17138671875, 1.272979736328125, 1.37457275390625, 1.476165771484375, 1.5777587890625, 1.679351806640625, 1.78094482421875, 1.882537841796875, 1.984130859375, 2.085723876953125, 2.18731689453125, 2.288909912109375, 2.3905029296875, 2.492095947265625, 2.59368896484375, 2.695281982421875, 2.796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 6.0, 12.0, 10.0, 9.0, 11.0, 15.0, 18.0, 17.0, 21.0, 41.0, 31.0, 34.0, 28.0, 29.0, 46.0, 47.0, 37.0, 40.0, 44.0, 46.0, 53.0, 50.0, 44.0, 34.0, 38.0, 29.0, 43.0, 17.0, 28.0, 19.0, 23.0, 14.0, 13.0, 7.0, 6.0, 4.0, 10.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.0684814453125, -3.929931640625, -3.7913818359375, -3.65283203125, -3.5142822265625, -3.375732421875, -3.2371826171875, -3.0986328125, -2.9600830078125, -2.821533203125, -2.6829833984375, -2.54443359375, -2.4058837890625, -2.267333984375, -2.1287841796875, -1.990234375, -1.8516845703125, -1.713134765625, -1.5745849609375, -1.43603515625, -1.2974853515625, -1.158935546875, -1.0203857421875, -0.8818359375, -0.7432861328125, -0.604736328125, -0.4661865234375, -0.32763671875, -0.1890869140625, -0.050537109375, 0.0880126953125, 0.2265625, 0.3651123046875, 0.503662109375, 0.6422119140625, 0.78076171875, 0.9193115234375, 1.057861328125, 1.1964111328125, 1.3349609375, 1.4735107421875, 1.612060546875, 1.7506103515625, 1.88916015625, 2.0277099609375, 2.166259765625, 2.3048095703125, 2.443359375, 2.5819091796875, 2.720458984375, 2.8590087890625, 2.99755859375, 3.1361083984375, 3.274658203125, 3.4132080078125, 3.5517578125, 3.6903076171875, 3.828857421875, 3.9674072265625, 4.10595703125, 4.2445068359375, 4.383056640625, 4.5216064453125, 4.66015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 24.0, 32.0, 39.0, 60.0, 86.0, 131.0, 274.0, 585.0, 1496.0, 4991.0, 26089.0, 299316.0, 665609.0, 39796.0, 6574.0, 1879.0, 723.0, 343.0, 179.0, 117.0, 62.0, 33.0, 27.0, 20.0, 17.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -1.00360107421875, -0.9691162109375, -0.93463134765625, -0.900146484375, -0.86566162109375, -0.8311767578125, -0.79669189453125, -0.76220703125, -0.72772216796875, -0.6932373046875, -0.65875244140625, -0.624267578125, -0.58978271484375, -0.5552978515625, -0.52081298828125, -0.486328125, -0.45184326171875, -0.4173583984375, -0.38287353515625, -0.348388671875, -0.31390380859375, -0.2794189453125, -0.24493408203125, -0.21044921875, -0.17596435546875, -0.1414794921875, -0.10699462890625, -0.072509765625, -0.03802490234375, -0.0035400390625, 0.03094482421875, 0.0654296875, 0.09991455078125, 0.1343994140625, 0.16888427734375, 0.203369140625, 0.23785400390625, 0.2723388671875, 0.30682373046875, 0.34130859375, 0.37579345703125, 0.4102783203125, 0.44476318359375, 0.479248046875, 0.51373291015625, 0.5482177734375, 0.58270263671875, 0.6171875, 0.65167236328125, 0.6861572265625, 0.72064208984375, 0.755126953125, 0.78961181640625, 0.8240966796875, 0.85858154296875, 0.89306640625, 0.92755126953125, 0.9620361328125, 0.99652099609375, 1.031005859375, 1.06549072265625, 1.0999755859375, 1.13446044921875, 1.1689453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 8.0, 4.0, 8.0, 16.0, 28.0, 24.0, 39.0, 44.0, 91.0, 136.0, 231.0, 121.0, 85.0, 37.0, 31.0, 32.0, 25.0, 8.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012171268463134766, -0.00011770427227020264, -0.00011369585990905762, -0.0001096874475479126, -0.00010567903518676758, -0.00010167062282562256, -9.766221046447754e-05, -9.365379810333252e-05, -8.96453857421875e-05, -8.563697338104248e-05, -8.162856101989746e-05, -7.762014865875244e-05, -7.361173629760742e-05, -6.96033239364624e-05, -6.559491157531738e-05, -6.158649921417236e-05, -5.7578086853027344e-05, -5.3569674491882324e-05, -4.9561262130737305e-05, -4.5552849769592285e-05, -4.1544437408447266e-05, -3.7536025047302246e-05, -3.3527612686157227e-05, -2.9519200325012207e-05, -2.5510787963867188e-05, -2.1502375602722168e-05, -1.749396324157715e-05, -1.3485550880432129e-05, -9.47713851928711e-06, -5.46872615814209e-06, -1.4603137969970703e-06, 2.5480985641479492e-06, 6.556510925292969e-06, 1.0564923286437988e-05, 1.4573335647583008e-05, 1.8581748008728027e-05, 2.2590160369873047e-05, 2.6598572731018066e-05, 3.0606985092163086e-05, 3.4615397453308105e-05, 3.8623809814453125e-05, 4.2632222175598145e-05, 4.6640634536743164e-05, 5.0649046897888184e-05, 5.46574592590332e-05, 5.866587162017822e-05, 6.267428398132324e-05, 6.668269634246826e-05, 7.069110870361328e-05, 7.46995210647583e-05, 7.870793342590332e-05, 8.271634578704834e-05, 8.672475814819336e-05, 9.073317050933838e-05, 9.47415828704834e-05, 9.874999523162842e-05, 0.00010275840759277344, 0.00010676681995391846, 0.00011077523231506348, 0.0001147836446762085, 0.00011879205703735352, 0.00012280046939849854, 0.00012680888175964355, 0.00013081729412078857, 0.0001348257064819336]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 9.0, 5.0, 9.0, 10.0, 18.0, 30.0, 43.0, 106.0, 226.0, 418.0, 1025.0, 3140.0, 16298.0, 237960.0, 748287.0, 33634.0, 4796.0, 1476.0, 539.0, 244.0, 117.0, 56.0, 33.0, 22.0, 14.0, 7.0, 3.0, 11.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.7685546875, -1.723388671875, -1.67822265625, -1.633056640625, -1.587890625, -1.542724609375, -1.49755859375, -1.452392578125, -1.4072265625, -1.362060546875, -1.31689453125, -1.271728515625, -1.2265625, -1.181396484375, -1.13623046875, -1.091064453125, -1.0458984375, -1.000732421875, -0.95556640625, -0.910400390625, -0.865234375, -0.820068359375, -0.77490234375, -0.729736328125, -0.6845703125, -0.639404296875, -0.59423828125, -0.549072265625, -0.50390625, -0.458740234375, -0.41357421875, -0.368408203125, -0.3232421875, -0.278076171875, -0.23291015625, -0.187744140625, -0.142578125, -0.097412109375, -0.05224609375, -0.007080078125, 0.0380859375, 0.083251953125, 0.12841796875, 0.173583984375, 0.21875, 0.263916015625, 0.30908203125, 0.354248046875, 0.3994140625, 0.444580078125, 0.48974609375, 0.534912109375, 0.580078125, 0.625244140625, 0.67041015625, 0.715576171875, 0.7607421875, 0.805908203125, 0.85107421875, 0.896240234375, 0.94140625, 0.986572265625, 1.03173828125, 1.076904296875, 1.1220703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 12.0, 20.0, 17.0, 19.0, 38.0, 49.0, 82.0, 132.0, 275.0, 117.0, 72.0, 46.0, 35.0, 15.0, 20.0, 13.0, 13.0, 7.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.457763671875, -0.4422264099121094, -0.42668914794921875, -0.4111518859863281, -0.3956146240234375, -0.3800773620605469, -0.36454010009765625, -0.3490028381347656, -0.333465576171875, -0.3179283142089844, -0.30239105224609375, -0.2868537902832031, -0.2713165283203125, -0.2557792663574219, -0.24024200439453125, -0.22470474243164062, -0.20916748046875, -0.19363021850585938, -0.17809295654296875, -0.16255569458007812, -0.1470184326171875, -0.13148117065429688, -0.11594390869140625, -0.10040664672851562, -0.084869384765625, -0.06933212280273438, -0.05379486083984375, -0.038257598876953125, -0.0227203369140625, -0.007183074951171875, 0.00835418701171875, 0.023891448974609375, 0.0394287109375, 0.054965972900390625, 0.07050323486328125, 0.08604049682617188, 0.1015777587890625, 0.11711502075195312, 0.13265228271484375, 0.14818954467773438, 0.163726806640625, 0.17926406860351562, 0.19480133056640625, 0.21033859252929688, 0.2258758544921875, 0.24141311645507812, 0.25695037841796875, 0.2724876403808594, 0.28802490234375, 0.3035621643066406, 0.31909942626953125, 0.3346366882324219, 0.3501739501953125, 0.3657112121582031, 0.38124847412109375, 0.3967857360839844, 0.412322998046875, 0.4278602600097656, 0.44339752197265625, 0.4589347839355469, 0.4744720458984375, 0.4900093078613281, 0.5055465698242188, 0.5210838317871094, 0.53662109375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 17.0, 14.0, 20.0, 52.0, 97.0, 178.0, 183.0, 170.0, 122.0, 65.0, 45.0, 24.0, 8.0, 11.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.51832389831543, -15.171737670898438, -14.825150489807129, -14.47856330871582, -14.131977081298828, -13.785390853881836, -13.438803672790527, -13.092216491699219, -12.745630264282227, -12.399044036865234, -12.052456855773926, -11.705869674682617, -11.359283447265625, -11.012697219848633, -10.666110038757324, -10.319522857666016, -9.972936630249023, -9.626350402832031, -9.279763221740723, -8.933176040649414, -8.586589813232422, -8.24000358581543, -7.893416404724121, -7.546829700469971, -7.20024299621582, -6.85365629196167, -6.5070695877075195, -6.160482883453369, -5.813896179199219, -5.467309474945068, -5.120722770690918, -4.774136066436768, -4.427548408508301, -4.08096170425415, -3.734375, -3.3877882957458496, -3.041201591491699, -2.694614887237549, -2.3480281829833984, -2.001441478729248, -1.6548547744750977, -1.3082680702209473, -0.9616813659667969, -0.6150946617126465, -0.2685079574584961, 0.0780787467956543, 0.4246654510498047, 0.7712521553039551, 1.1178388595581055, 1.4644255638122559, 1.8110122680664062, 2.1575989723205566, 2.504185676574707, 2.8507723808288574, 3.197359085083008, 3.543945789337158, 3.8905324935913086, 4.237119197845459, 4.583705902099609, 4.93029260635376, 5.27687931060791, 5.6234660148620605, 5.970052719116211, 6.316639423370361, 6.663226127624512]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 8.0, 8.0, 11.0, 7.0, 14.0, 12.0, 19.0, 21.0, 20.0, 15.0, 23.0, 24.0, 27.0, 17.0, 26.0, 29.0, 27.0, 33.0, 36.0, 39.0, 53.0, 34.0, 38.0, 36.0, 35.0, 33.0, 35.0, 31.0, 34.0, 41.0, 18.0, 24.0, 21.0, 23.0, 23.0, 20.0, 11.0, 12.0, 7.0, 5.0, 9.0, 7.0, 3.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-6.2397027015686035, -6.039177894592285, -5.838653564453125, -5.638128757476807, -5.4376044273376465, -5.237079620361328, -5.036555290222168, -4.83603048324585, -4.635505676269531, -4.434980869293213, -4.234456539154053, -4.033931732177734, -3.833407402038574, -3.632882595062256, -3.4323580265045166, -3.2318334579467773, -3.031309127807617, -2.830784559249878, -2.6302599906921387, -2.4297351837158203, -2.22921085357666, -2.028686046600342, -1.8281614780426025, -1.6276369094848633, -1.427112340927124, -1.2265877723693848, -1.0260632038116455, -0.8255385160446167, -0.6250139474868774, -0.4244893789291382, -0.22396469116210938, -0.023440122604370117, 0.17708396911621094, 0.3776085674762726, 0.5781331658363342, 0.7786577939987183, 0.9791823625564575, 1.1797069311141968, 1.3802316188812256, 1.5807561874389648, 1.781280755996704, 1.9818053245544434, 2.1823298931121826, 2.382854461669922, 2.5833792686462402, 2.7839035987854004, 2.9844284057617188, 3.184952974319458, 3.3854775428771973, 3.5860021114349365, 3.786526679992676, 3.987051486968994, 4.187575817108154, 4.388100624084473, 4.588624954223633, 4.789149761199951, 4.9896745681762695, 5.190199375152588, 5.390723705291748, 5.591248512268066, 5.791772842407227, 5.992297649383545, 6.192822456359863, 6.393346786499023, 6.593871116638184]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 12.0, 23.0, 42.0, 88.0, 203.0, 488.0, 1343.0, 4035.0, 17951.0, 233808.0, 3246645.0, 646977.0, 34332.0, 5648.0, 1662.0, 589.0, 227.0, 100.0, 47.0, 26.0, 11.0, 6.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.625, -5.447265625, -5.26953125, -5.091796875, -4.9140625, -4.736328125, -4.55859375, -4.380859375, -4.203125, -4.025390625, -3.84765625, -3.669921875, -3.4921875, -3.314453125, -3.13671875, -2.958984375, -2.78125, -2.603515625, -2.42578125, -2.248046875, -2.0703125, -1.892578125, -1.71484375, -1.537109375, -1.359375, -1.181640625, -1.00390625, -0.826171875, -0.6484375, -0.470703125, -0.29296875, -0.115234375, 0.0625, 0.240234375, 0.41796875, 0.595703125, 0.7734375, 0.951171875, 1.12890625, 1.306640625, 1.484375, 1.662109375, 1.83984375, 2.017578125, 2.1953125, 2.373046875, 2.55078125, 2.728515625, 2.90625, 3.083984375, 3.26171875, 3.439453125, 3.6171875, 3.794921875, 3.97265625, 4.150390625, 4.328125, 4.505859375, 4.68359375, 4.861328125, 5.0390625, 5.216796875, 5.39453125, 5.572265625, 5.75]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 4.0, 4.0, 8.0, 6.0, 8.0, 15.0, 19.0, 26.0, 30.0, 28.0, 27.0, 44.0, 53.0, 54.0, 53.0, 54.0, 60.0, 57.0, 48.0, 68.0, 52.0, 50.0, 52.0, 37.0, 30.0, 19.0, 21.0, 14.0, 8.0, 13.0, 10.0, 6.0, 6.0, 6.0, 1.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.9908447265625, -2.893798828125, -2.7967529296875, -2.69970703125, -2.6026611328125, -2.505615234375, -2.4085693359375, -2.3115234375, -2.2144775390625, -2.117431640625, -2.0203857421875, -1.92333984375, -1.8262939453125, -1.729248046875, -1.6322021484375, -1.53515625, -1.4381103515625, -1.341064453125, -1.2440185546875, -1.14697265625, -1.0499267578125, -0.952880859375, -0.8558349609375, -0.7587890625, -0.6617431640625, -0.564697265625, -0.4676513671875, -0.37060546875, -0.2735595703125, -0.176513671875, -0.0794677734375, 0.017578125, 0.1146240234375, 0.211669921875, 0.3087158203125, 0.40576171875, 0.5028076171875, 0.599853515625, 0.6968994140625, 0.7939453125, 0.8909912109375, 0.988037109375, 1.0850830078125, 1.18212890625, 1.2791748046875, 1.376220703125, 1.4732666015625, 1.5703125, 1.6673583984375, 1.764404296875, 1.8614501953125, 1.95849609375, 2.0555419921875, 2.152587890625, 2.2496337890625, 2.3466796875, 2.4437255859375, 2.540771484375, 2.6378173828125, 2.73486328125, 2.8319091796875, 2.928955078125, 3.0260009765625, 3.123046875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 10.0, 7.0, 22.0, 28.0, 48.0, 81.0, 99.0, 150.0, 247.0, 473.0, 1069.0, 2834.0, 10449.0, 75229.0, 3405823.0, 657616.0, 30383.0, 6107.0, 1888.0, 778.0, 378.0, 185.0, 120.0, 66.0, 48.0, 35.0, 25.0, 19.0, 13.0, 8.0, 7.0, 7.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.30303955078125, -4.1295166015625, -3.95599365234375, -3.782470703125, -3.60894775390625, -3.4354248046875, -3.26190185546875, -3.08837890625, -2.91485595703125, -2.7413330078125, -2.56781005859375, -2.394287109375, -2.22076416015625, -2.0472412109375, -1.87371826171875, -1.7001953125, -1.52667236328125, -1.3531494140625, -1.17962646484375, -1.006103515625, -0.83258056640625, -0.6590576171875, -0.48553466796875, -0.31201171875, -0.13848876953125, 0.0350341796875, 0.20855712890625, 0.382080078125, 0.55560302734375, 0.7291259765625, 0.90264892578125, 1.076171875, 1.24969482421875, 1.4232177734375, 1.59674072265625, 1.770263671875, 1.94378662109375, 2.1173095703125, 2.29083251953125, 2.46435546875, 2.63787841796875, 2.8114013671875, 2.98492431640625, 3.158447265625, 3.33197021484375, 3.5054931640625, 3.67901611328125, 3.8525390625, 4.02606201171875, 4.1995849609375, 4.37310791015625, 4.546630859375, 4.72015380859375, 4.8936767578125, 5.06719970703125, 5.24072265625, 5.41424560546875, 5.5877685546875, 5.76129150390625, 5.934814453125, 6.10833740234375, 6.2818603515625, 6.45538330078125, 6.62890625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 9.0, 5.0, 13.0, 14.0, 19.0, 29.0, 58.0, 88.0, 196.0, 359.0, 680.0, 865.0, 792.0, 432.0, 209.0, 111.0, 64.0, 36.0, 25.0, 17.0, 11.0, 10.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4033203125, -1.355865478515625, -1.30841064453125, -1.260955810546875, -1.2135009765625, -1.166046142578125, -1.11859130859375, -1.071136474609375, -1.023681640625, -0.976226806640625, -0.92877197265625, -0.881317138671875, -0.8338623046875, -0.786407470703125, -0.73895263671875, -0.691497802734375, -0.64404296875, -0.596588134765625, -0.54913330078125, -0.501678466796875, -0.4542236328125, -0.406768798828125, -0.35931396484375, -0.311859130859375, -0.264404296875, -0.216949462890625, -0.16949462890625, -0.122039794921875, -0.0745849609375, -0.027130126953125, 0.02032470703125, 0.067779541015625, 0.115234375, 0.162689208984375, 0.21014404296875, 0.257598876953125, 0.3050537109375, 0.352508544921875, 0.39996337890625, 0.447418212890625, 0.494873046875, 0.542327880859375, 0.58978271484375, 0.637237548828125, 0.6846923828125, 0.732147216796875, 0.77960205078125, 0.827056884765625, 0.87451171875, 0.921966552734375, 0.96942138671875, 1.016876220703125, 1.0643310546875, 1.111785888671875, 1.15924072265625, 1.206695556640625, 1.254150390625, 1.301605224609375, 1.34906005859375, 1.396514892578125, 1.4439697265625, 1.491424560546875, 1.53887939453125, 1.586334228515625, 1.6337890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 8.0, 11.0, 13.0, 20.0, 29.0, 42.0, 63.0, 85.0, 104.0, 120.0, 122.0, 100.0, 85.0, 65.0, 46.0, 40.0, 19.0, 7.0, 13.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.730464458465576, -5.562582969665527, -5.39470100402832, -5.2268195152282715, -5.0589375495910645, -4.891056060791016, -4.723174095153809, -4.55529260635376, -4.387411117553711, -4.219529628753662, -4.051647663116455, -3.8837661743164062, -3.7158844470977783, -3.5480027198791504, -3.3801209926605225, -3.2122392654418945, -3.0443575382232666, -2.8764758110046387, -2.7085940837860107, -2.540712356567383, -2.372830867767334, -2.204949140548706, -2.037067413330078, -1.8691858053207397, -1.7013040781021118, -1.5334223508834839, -1.3655407428741455, -1.1976590156555176, -1.0297772884368896, -0.8618956804275513, -0.6940139532089233, -0.526132345199585, -0.35825061798095703, -0.19036893546581268, -0.022487252950668335, 0.1453944444656372, 0.31327611207962036, 0.4811577796936035, 0.6490395069122314, 0.8169211149215698, 0.9848028421401978, 1.1526845693588257, 1.320566177368164, 1.488447904586792, 1.65632963180542, 1.8242112398147583, 1.9920929670333862, 2.1599745750427246, 2.3278563022613525, 2.4957380294799805, 2.6636197566986084, 2.8315014839172363, 2.999382972717285, 3.167264699935913, 3.335146427154541, 3.50302791595459, 3.670909881591797, 3.838791608810425, 4.006673336029053, 4.174554824829102, 4.342436790466309, 4.510318279266357, 4.678199768066406, 4.846081733703613, 5.013963222503662]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 4.0, 1.0, 5.0, 10.0, 8.0, 10.0, 11.0, 30.0, 21.0, 24.0, 24.0, 21.0, 36.0, 31.0, 31.0, 43.0, 33.0, 52.0, 52.0, 41.0, 46.0, 45.0, 48.0, 44.0, 36.0, 39.0, 30.0, 39.0, 36.0, 31.0, 18.0, 17.0, 10.0, 14.0, 13.0, 15.0, 5.0, 5.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6991169452667236, -2.611685276031494, -2.5242536067962646, -2.436821937561035, -2.3493902683258057, -2.261958599090576, -2.1745266914367676, -2.087095260620117, -1.9996634721755981, -1.9122318029403687, -1.8248001337051392, -1.7373683452606201, -1.6499366760253906, -1.5625050067901611, -1.4750733375549316, -1.3876416683197021, -1.3002099990844727, -1.2127783298492432, -1.1253466606140137, -1.0379149913787842, -0.9504832625389099, -0.8630515933036804, -0.7756198644638062, -0.6881881952285767, -0.6007565259933472, -0.5133248567581177, -0.4258931577205658, -0.3384614586830139, -0.2510297894477844, -0.16359812021255493, -0.07616639137268066, 0.011265277862548828, 0.09869670867919922, 0.1861283928155899, 0.2735600769519806, 0.36099177598953247, 0.44842344522476196, 0.5358551144599915, 0.6232868432998657, 0.7107185125350952, 0.7981501817703247, 0.8855818510055542, 0.9730135202407837, 1.0604453086853027, 1.1478769779205322, 1.2353086471557617, 1.3227403163909912, 1.4101719856262207, 1.4976036548614502, 1.5850353240966797, 1.6724669933319092, 1.7598986625671387, 1.8473303318023682, 1.9347620010375977, 2.0221939086914062, 2.1096253395080566, 2.1970572471618652, 2.2844889163970947, 2.371920585632324, 2.4593522548675537, 2.546783924102783, 2.6342155933380127, 2.721647262573242, 2.809079170227051, 2.896510601043701]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 31.0, 37.0, 51.0, 85.0, 148.0, 296.0, 647.0, 1527.0, 5323.0, 23969.0, 163837.0, 719710.0, 108554.0, 17722.0, 4146.0, 1329.0, 520.0, 238.0, 142.0, 78.0, 50.0, 28.0, 14.0, 16.0, 11.0, 13.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91064453125, -0.8833847045898438, -0.8561248779296875, -0.8288650512695312, -0.801605224609375, -0.7743453979492188, -0.7470855712890625, -0.7198257446289062, -0.69256591796875, -0.6653060913085938, -0.6380462646484375, -0.6107864379882812, -0.583526611328125, -0.5562667846679688, -0.5290069580078125, -0.5017471313476562, -0.4744873046875, -0.44722747802734375, -0.4199676513671875, -0.39270782470703125, -0.365447998046875, -0.33818817138671875, -0.3109283447265625, -0.28366851806640625, -0.25640869140625, -0.22914886474609375, -0.2018890380859375, -0.17462921142578125, -0.147369384765625, -0.12010955810546875, -0.0928497314453125, -0.06558990478515625, -0.038330078125, -0.01107025146484375, 0.0161895751953125, 0.04344940185546875, 0.070709228515625, 0.09796905517578125, 0.1252288818359375, 0.15248870849609375, 0.17974853515625, 0.20700836181640625, 0.2342681884765625, 0.26152801513671875, 0.288787841796875, 0.31604766845703125, 0.3433074951171875, 0.37056732177734375, 0.3978271484375, 0.42508697509765625, 0.4523468017578125, 0.47960662841796875, 0.506866455078125, 0.5341262817382812, 0.5613861083984375, 0.5886459350585938, 0.61590576171875, 0.6431655883789062, 0.6704254150390625, 0.6976852416992188, 0.724945068359375, 0.7522048950195312, 0.7794647216796875, 0.8067245483398438, 0.833984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 12.0, 13.0, 17.0, 25.0, 35.0, 39.0, 38.0, 36.0, 67.0, 63.0, 66.0, 78.0, 59.0, 66.0, 74.0, 71.0, 54.0, 41.0, 35.0, 24.0, 26.0, 15.0, 6.0, 13.0, 4.0, 5.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921875, -2.904083251953125, -2.81597900390625, -2.727874755859375, -2.6397705078125, -2.551666259765625, -2.46356201171875, -2.375457763671875, -2.287353515625, -2.199249267578125, -2.11114501953125, -2.023040771484375, -1.9349365234375, -1.846832275390625, -1.75872802734375, -1.670623779296875, -1.58251953125, -1.494415283203125, -1.40631103515625, -1.318206787109375, -1.2301025390625, -1.141998291015625, -1.05389404296875, -0.965789794921875, -0.877685546875, -0.789581298828125, -0.70147705078125, -0.613372802734375, -0.5252685546875, -0.437164306640625, -0.34906005859375, -0.260955810546875, -0.1728515625, -0.084747314453125, 0.00335693359375, 0.091461181640625, 0.1795654296875, 0.267669677734375, 0.35577392578125, 0.443878173828125, 0.531982421875, 0.620086669921875, 0.70819091796875, 0.796295166015625, 0.8843994140625, 0.972503662109375, 1.06060791015625, 1.148712158203125, 1.23681640625, 1.324920654296875, 1.41302490234375, 1.501129150390625, 1.5892333984375, 1.677337646484375, 1.76544189453125, 1.853546142578125, 1.941650390625, 2.029754638671875, 2.11785888671875, 2.205963134765625, 2.2940673828125, 2.382171630859375, 2.47027587890625, 2.558380126953125, 2.646484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 9.0, 21.0, 23.0, 42.0, 41.0, 90.0, 109.0, 164.0, 266.0, 323.0, 481.0, 753.0, 1138.0, 1787.0, 2831.0, 4514.0, 7258.0, 12680.0, 22300.0, 41986.0, 83573.0, 184503.0, 303084.0, 190981.0, 88256.0, 44090.0, 23383.0, 13195.0, 7753.0, 4669.0, 2799.0, 1802.0, 1218.0, 783.0, 532.0, 360.0, 227.0, 176.0, 107.0, 82.0, 50.0, 31.0, 30.0, 12.0, 12.0, 7.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.1973876953125, -0.1914997100830078, -0.18561172485351562, -0.17972373962402344, -0.17383575439453125, -0.16794776916503906, -0.16205978393554688, -0.1561717987060547, -0.1502838134765625, -0.1443958282470703, -0.13850784301757812, -0.13261985778808594, -0.12673187255859375, -0.12084388732910156, -0.11495590209960938, -0.10906791687011719, -0.103179931640625, -0.09729194641113281, -0.09140396118164062, -0.08551597595214844, -0.07962799072265625, -0.07374000549316406, -0.06785202026367188, -0.06196403503417969, -0.0560760498046875, -0.05018806457519531, -0.044300079345703125, -0.03841209411621094, -0.03252410888671875, -0.026636123657226562, -0.020748138427734375, -0.014860153198242188, -0.00897216796875, -0.0030841827392578125, 0.002803802490234375, 0.008691787719726562, 0.01457977294921875, 0.020467758178710938, 0.026355743408203125, 0.03224372863769531, 0.0381317138671875, 0.04401969909667969, 0.049907684326171875, 0.05579566955566406, 0.06168365478515625, 0.06757164001464844, 0.07345962524414062, 0.07934761047363281, 0.085235595703125, 0.09112358093261719, 0.09701156616210938, 0.10289955139160156, 0.10878753662109375, 0.11467552185058594, 0.12056350708007812, 0.1264514923095703, 0.1323394775390625, 0.1382274627685547, 0.14411544799804688, 0.15000343322753906, 0.15589141845703125, 0.16177940368652344, 0.16766738891601562, 0.1735553741455078, 0.179443359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 6.0, 9.0, 7.0, 14.0, 19.0, 17.0, 21.0, 25.0, 24.0, 27.0, 29.0, 28.0, 46.0, 52.0, 30.0, 45.0, 49.0, 44.0, 38.0, 41.0, 46.0, 55.0, 39.0, 42.0, 39.0, 30.0, 20.0, 26.0, 18.0, 23.0, 19.0, 12.0, 10.0, 7.0, 2.0, 6.0, 8.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.9453125, -3.829132080078125, -3.71295166015625, -3.596771240234375, -3.4805908203125, -3.364410400390625, -3.24822998046875, -3.132049560546875, -3.015869140625, -2.899688720703125, -2.78350830078125, -2.667327880859375, -2.5511474609375, -2.434967041015625, -2.31878662109375, -2.202606201171875, -2.08642578125, -1.970245361328125, -1.85406494140625, -1.737884521484375, -1.6217041015625, -1.505523681640625, -1.38934326171875, -1.273162841796875, -1.156982421875, -1.040802001953125, -0.92462158203125, -0.808441162109375, -0.6922607421875, -0.576080322265625, -0.45989990234375, -0.343719482421875, -0.2275390625, -0.111358642578125, 0.00482177734375, 0.121002197265625, 0.2371826171875, 0.353363037109375, 0.46954345703125, 0.585723876953125, 0.701904296875, 0.818084716796875, 0.93426513671875, 1.050445556640625, 1.1666259765625, 1.282806396484375, 1.39898681640625, 1.515167236328125, 1.63134765625, 1.747528076171875, 1.86370849609375, 1.979888916015625, 2.0960693359375, 2.212249755859375, 2.32843017578125, 2.444610595703125, 2.560791015625, 2.676971435546875, 2.79315185546875, 2.909332275390625, 3.0255126953125, 3.141693115234375, 3.25787353515625, 3.374053955078125, 3.490234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 14.0, 11.0, 16.0, 37.0, 40.0, 67.0, 92.0, 154.0, 235.0, 345.0, 853.0, 2579.0, 12839.0, 221399.0, 775630.0, 27684.0, 4365.0, 1122.0, 410.0, 241.0, 145.0, 100.0, 57.0, 35.0, 25.0, 18.0, 5.0, 8.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.117431640625, -0.1138906478881836, -0.11034965515136719, -0.10680866241455078, -0.10326766967773438, -0.09972667694091797, -0.09618568420410156, -0.09264469146728516, -0.08910369873046875, -0.08556270599365234, -0.08202171325683594, -0.07848072052001953, -0.07493972778320312, -0.07139873504638672, -0.06785774230957031, -0.0643167495727539, -0.0607757568359375, -0.057234764099121094, -0.05369377136230469, -0.05015277862548828, -0.046611785888671875, -0.04307079315185547, -0.03952980041503906, -0.035988807678222656, -0.03244781494140625, -0.028906822204589844, -0.025365829467773438, -0.02182483673095703, -0.018283843994140625, -0.014742851257324219, -0.011201858520507812, -0.007660865783691406, -0.004119873046875, -0.0005788803100585938, 0.0029621124267578125, 0.006503105163574219, 0.010044097900390625, 0.013585090637207031, 0.017126083374023438, 0.020667076110839844, 0.02420806884765625, 0.027749061584472656, 0.03129005432128906, 0.03483104705810547, 0.038372039794921875, 0.04191303253173828, 0.04545402526855469, 0.048995018005371094, 0.0525360107421875, 0.056077003479003906, 0.05961799621582031, 0.06315898895263672, 0.06669998168945312, 0.07024097442626953, 0.07378196716308594, 0.07732295989990234, 0.08086395263671875, 0.08440494537353516, 0.08794593811035156, 0.09148693084716797, 0.09502792358398438, 0.09856891632080078, 0.10210990905761719, 0.1056509017944336, 0.10919189453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 3.0, 13.0, 4.0, 10.0, 20.0, 30.0, 42.0, 74.0, 91.0, 91.0, 136.0, 120.0, 94.0, 79.0, 48.0, 40.0, 15.0, 25.0, 17.0, 11.0, 13.0, 4.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.6803226470947266e-05, -5.5264681577682495e-05, -5.3726136684417725e-05, -5.2187591791152954e-05, -5.0649046897888184e-05, -4.911050200462341e-05, -4.757195711135864e-05, -4.603341221809387e-05, -4.44948673248291e-05, -4.295632243156433e-05, -4.141777753829956e-05, -3.987923264503479e-05, -3.834068775177002e-05, -3.680214285850525e-05, -3.526359796524048e-05, -3.372505307197571e-05, -3.218650817871094e-05, -3.064796328544617e-05, -2.9109418392181396e-05, -2.7570873498916626e-05, -2.6032328605651855e-05, -2.4493783712387085e-05, -2.2955238819122314e-05, -2.1416693925857544e-05, -1.9878149032592773e-05, -1.8339604139328003e-05, -1.6801059246063232e-05, -1.5262514352798462e-05, -1.3723969459533691e-05, -1.2185424566268921e-05, -1.064687967300415e-05, -9.10833477973938e-06, -7.569789886474609e-06, -6.031244993209839e-06, -4.492700099945068e-06, -2.954155206680298e-06, -1.4156103134155273e-06, 1.2293457984924316e-07, 1.6614794731140137e-06, 3.200024366378784e-06, 4.738569259643555e-06, 6.277114152908325e-06, 7.815659046173096e-06, 9.354203939437866e-06, 1.0892748832702637e-05, 1.2431293725967407e-05, 1.3969838619232178e-05, 1.5508383512496948e-05, 1.704692840576172e-05, 1.858547329902649e-05, 2.012401819229126e-05, 2.166256308555603e-05, 2.32011079788208e-05, 2.473965287208557e-05, 2.6278197765350342e-05, 2.7816742658615112e-05, 2.9355287551879883e-05, 3.089383244514465e-05, 3.2432377338409424e-05, 3.3970922231674194e-05, 3.5509467124938965e-05, 3.7048012018203735e-05, 3.8586556911468506e-05, 4.0125101804733276e-05, 4.166364669799805e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 1.0, 6.0, 7.0, 7.0, 14.0, 12.0, 27.0, 26.0, 30.0, 41.0, 67.0, 97.0, 161.0, 379.0, 1079.0, 4206.0, 30719.0, 886848.0, 112824.0, 8948.0, 1847.0, 605.0, 226.0, 128.0, 76.0, 45.0, 34.0, 22.0, 19.0, 11.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1207275390625, -0.11603164672851562, -0.11133575439453125, -0.10663986206054688, -0.1019439697265625, -0.09724807739257812, -0.09255218505859375, -0.08785629272460938, -0.083160400390625, -0.07846450805664062, -0.07376861572265625, -0.06907272338867188, -0.0643768310546875, -0.059680938720703125, -0.05498504638671875, -0.050289154052734375, -0.04559326171875, -0.040897369384765625, -0.03620147705078125, -0.031505584716796875, -0.0268096923828125, -0.022113800048828125, -0.01741790771484375, -0.012722015380859375, -0.008026123046875, -0.003330230712890625, 0.00136566162109375, 0.006061553955078125, 0.0107574462890625, 0.015453338623046875, 0.02014923095703125, 0.024845123291015625, 0.029541015625, 0.034236907958984375, 0.03893280029296875, 0.043628692626953125, 0.0483245849609375, 0.053020477294921875, 0.05771636962890625, 0.062412261962890625, 0.067108154296875, 0.07180404663085938, 0.07649993896484375, 0.08119583129882812, 0.0858917236328125, 0.09058761596679688, 0.09528350830078125, 0.09997940063476562, 0.10467529296875, 0.10937118530273438, 0.11406707763671875, 0.11876296997070312, 0.1234588623046875, 0.12815475463867188, 0.13285064697265625, 0.13754653930664062, 0.142242431640625, 0.14693832397460938, 0.15163421630859375, 0.15633010864257812, 0.1610260009765625, 0.16572189331054688, 0.17041778564453125, 0.17511367797851562, 0.1798095703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 13.0, 18.0, 45.0, 103.0, 330.0, 295.0, 103.0, 54.0, 16.0, 10.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0645751953125, -0.062957763671875, -0.06134033203125, -0.059722900390625, -0.05810546875, -0.056488037109375, -0.05487060546875, -0.053253173828125, -0.0516357421875, -0.050018310546875, -0.04840087890625, -0.046783447265625, -0.045166015625, -0.043548583984375, -0.04193115234375, -0.040313720703125, -0.0386962890625, -0.037078857421875, -0.03546142578125, -0.033843994140625, -0.0322265625, -0.030609130859375, -0.02899169921875, -0.027374267578125, -0.0257568359375, -0.024139404296875, -0.02252197265625, -0.020904541015625, -0.019287109375, -0.017669677734375, -0.01605224609375, -0.014434814453125, -0.0128173828125, -0.011199951171875, -0.00958251953125, -0.007965087890625, -0.00634765625, -0.004730224609375, -0.00311279296875, -0.001495361328125, 0.0001220703125, 0.001739501953125, 0.00335693359375, 0.004974365234375, 0.006591796875, 0.008209228515625, 0.00982666015625, 0.011444091796875, 0.0130615234375, 0.014678955078125, 0.01629638671875, 0.017913818359375, 0.01953125, 0.021148681640625, 0.02276611328125, 0.024383544921875, 0.0260009765625, 0.027618408203125, 0.02923583984375, 0.030853271484375, 0.032470703125, 0.034088134765625, 0.03570556640625, 0.037322998046875, 0.0389404296875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 18.0, 15.0, 37.0, 70.0, 144.0, 178.0, 204.0, 137.0, 90.0, 55.0, 28.0, 13.0, 9.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.498447418212891, -7.328708171844482, -7.158968925476074, -6.989229202270508, -6.8194899559021, -6.649750709533691, -6.480011463165283, -6.310272216796875, -6.140532493591309, -5.9707932472229, -5.801054000854492, -5.631314277648926, -5.461575031280518, -5.291835784912109, -5.122096538543701, -4.952357292175293, -4.782618045806885, -4.612878799438477, -4.443139553070068, -4.27340030670166, -4.103660583496094, -3.9339213371276855, -3.7641820907592773, -3.594442844390869, -3.424703359603882, -3.2549641132354736, -3.0852246284484863, -2.915485382080078, -2.74574613571167, -2.5760066509246826, -2.4062674045562744, -2.236527919769287, -2.0667881965637207, -1.897048830986023, -1.7273094654083252, -1.557570219039917, -1.3878308534622192, -1.2180914878845215, -1.0483522415161133, -0.8786128759384155, -0.7088735103607178, -0.53913414478302, -0.36939483880996704, -0.19965553283691406, -0.02991616725921631, 0.13982319831848145, 0.30956244468688965, 0.4793018102645874, 0.6490411758422852, 0.8187805414199829, 0.9885198473930359, 1.1582591533660889, 1.3279985189437866, 1.4977378845214844, 1.6674771308898926, 1.8372164964675903, 2.006955862045288, 2.1766951084136963, 2.3464345932006836, 2.516173839569092, 2.6859130859375, 2.8556525707244873, 3.0253918170928955, 3.195131301879883, 3.364870548248291]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 6.0, 7.0, 15.0, 19.0, 30.0, 37.0, 27.0, 37.0, 43.0, 58.0, 51.0, 65.0, 71.0, 65.0, 61.0, 66.0, 52.0, 40.0, 51.0, 52.0, 34.0, 22.0, 14.0, 20.0, 12.0, 11.0, 5.0, 10.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6339807510375977, -2.557360887527466, -2.480741262435913, -2.4041213989257812, -2.3275017738342285, -2.2508819103240967, -2.174262285232544, -2.097642421722412, -2.0210227966308594, -1.944403052330017, -1.8677833080291748, -1.7911635637283325, -1.7145438194274902, -1.6379239559173584, -1.5613042116165161, -1.4846844673156738, -1.408064603805542, -1.3314448595046997, -1.2548251152038574, -1.1782053709030151, -1.1015856266021729, -1.024965763092041, -0.9483460187911987, -0.8717262744903564, -0.7951065301895142, -0.7184867858886719, -0.6418670415878296, -0.5652472376823425, -0.48862749338150024, -0.41200774908065796, -0.3353879749774933, -0.2587682008743286, -0.18214821815490723, -0.10552845895290375, -0.02890869975090027, 0.04771105945110321, 0.12433081865310669, 0.20095056295394897, 0.27757033705711365, 0.3541901111602783, 0.4308098554611206, 0.5074295997619629, 0.5840493440628052, 0.6606691479682922, 0.7372888922691345, 0.8139086365699768, 0.8905284404754639, 0.9671481847763062, 1.0437679290771484, 1.1203876733779907, 1.197007417678833, 1.2736271619796753, 1.3502469062805176, 1.4268667697906494, 1.5034865140914917, 1.580106258392334, 1.6567260026931763, 1.7333457469940186, 1.8099654912948608, 1.8865852355957031, 1.963205099105835, 2.0398247241973877, 2.1164445877075195, 2.1930642127990723, 2.269684076309204]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 1.0, 1.0, 6.0, 5.0, 4.0, 4.0, 16.0, 16.0, 15.0, 27.0, 40.0, 51.0, 80.0, 128.0, 184.0, 292.0, 514.0, 847.0, 1508.0, 2831.0, 6137.0, 16108.0, 61619.0, 426962.0, 438931.0, 62934.0, 16276.0, 6273.0, 2969.0, 1492.0, 857.0, 526.0, 291.0, 190.0, 133.0, 84.0, 68.0, 40.0, 32.0, 16.0, 6.0, 8.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.47265625, -1.42803955078125, -1.3834228515625, -1.33880615234375, -1.294189453125, -1.24957275390625, -1.2049560546875, -1.16033935546875, -1.11572265625, -1.07110595703125, -1.0264892578125, -0.98187255859375, -0.937255859375, -0.89263916015625, -0.8480224609375, -0.80340576171875, -0.7587890625, -0.71417236328125, -0.6695556640625, -0.62493896484375, -0.580322265625, -0.53570556640625, -0.4910888671875, -0.44647216796875, -0.40185546875, -0.35723876953125, -0.3126220703125, -0.26800537109375, -0.223388671875, -0.17877197265625, -0.1341552734375, -0.08953857421875, -0.044921875, -0.00030517578125, 0.0443115234375, 0.08892822265625, 0.133544921875, 0.17816162109375, 0.2227783203125, 0.26739501953125, 0.31201171875, 0.35662841796875, 0.4012451171875, 0.44586181640625, 0.490478515625, 0.53509521484375, 0.5797119140625, 0.62432861328125, 0.6689453125, 0.71356201171875, 0.7581787109375, 0.80279541015625, 0.847412109375, 0.89202880859375, 0.9366455078125, 0.98126220703125, 1.02587890625, 1.07049560546875, 1.1151123046875, 1.15972900390625, 1.204345703125, 1.24896240234375, 1.2935791015625, 1.33819580078125, 1.3828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 3.0, 0.0, 7.0, 10.0, 12.0, 16.0, 18.0, 31.0, 35.0, 38.0, 59.0, 43.0, 50.0, 57.0, 80.0, 58.0, 71.0, 45.0, 70.0, 59.0, 59.0, 43.0, 35.0, 19.0, 22.0, 16.0, 8.0, 14.0, 8.0, 8.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.99609375, -5.832275390625, -5.66845703125, -5.504638671875, -5.3408203125, -5.177001953125, -5.01318359375, -4.849365234375, -4.685546875, -4.521728515625, -4.35791015625, -4.194091796875, -4.0302734375, -3.866455078125, -3.70263671875, -3.538818359375, -3.375, -3.211181640625, -3.04736328125, -2.883544921875, -2.7197265625, -2.555908203125, -2.39208984375, -2.228271484375, -2.064453125, -1.900634765625, -1.73681640625, -1.572998046875, -1.4091796875, -1.245361328125, -1.08154296875, -0.917724609375, -0.75390625, -0.590087890625, -0.42626953125, -0.262451171875, -0.0986328125, 0.065185546875, 0.22900390625, 0.392822265625, 0.556640625, 0.720458984375, 0.88427734375, 1.048095703125, 1.2119140625, 1.375732421875, 1.53955078125, 1.703369140625, 1.8671875, 2.031005859375, 2.19482421875, 2.358642578125, 2.5224609375, 2.686279296875, 2.85009765625, 3.013916015625, 3.177734375, 3.341552734375, 3.50537109375, 3.669189453125, 3.8330078125, 3.996826171875, 4.16064453125, 4.324462890625, 4.48828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 15.0, 18.0, 8.0, 18.0, 23.0, 32.0, 38.0, 59.0, 83.0, 109.0, 182.0, 295.0, 599.0, 1358.0, 4351.0, 29573.0, 890590.0, 109427.0, 7763.0, 2097.0, 814.0, 375.0, 222.0, 131.0, 94.0, 60.0, 55.0, 39.0, 21.0, 20.0, 15.0, 14.0, 13.0, 7.0, 7.0, 2.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.833984375, -2.74163818359375, -2.6492919921875, -2.55694580078125, -2.464599609375, -2.37225341796875, -2.2799072265625, -2.18756103515625, -2.09521484375, -2.00286865234375, -1.9105224609375, -1.81817626953125, -1.725830078125, -1.63348388671875, -1.5411376953125, -1.44879150390625, -1.3564453125, -1.26409912109375, -1.1717529296875, -1.07940673828125, -0.987060546875, -0.89471435546875, -0.8023681640625, -0.71002197265625, -0.61767578125, -0.52532958984375, -0.4329833984375, -0.34063720703125, -0.248291015625, -0.15594482421875, -0.0635986328125, 0.02874755859375, 0.12109375, 0.21343994140625, 0.3057861328125, 0.39813232421875, 0.490478515625, 0.58282470703125, 0.6751708984375, 0.76751708984375, 0.85986328125, 0.95220947265625, 1.0445556640625, 1.13690185546875, 1.229248046875, 1.32159423828125, 1.4139404296875, 1.50628662109375, 1.5986328125, 1.69097900390625, 1.7833251953125, 1.87567138671875, 1.968017578125, 2.06036376953125, 2.1527099609375, 2.24505615234375, 2.33740234375, 2.42974853515625, 2.5220947265625, 2.61444091796875, 2.706787109375, 2.79913330078125, 2.8914794921875, 2.98382568359375, 3.076171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 11.0, 12.0, 17.0, 17.0, 26.0, 18.0, 31.0, 33.0, 39.0, 23.0, 37.0, 49.0, 53.0, 45.0, 50.0, 48.0, 40.0, 62.0, 38.0, 43.0, 42.0, 31.0, 33.0, 24.0, 28.0, 27.0, 17.0, 17.0, 10.0, 11.0, 16.0, 5.0, 1.0, 5.0, 4.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.97265625, -4.8232421875, -4.673828125, -4.5244140625, -4.375, -4.2255859375, -4.076171875, -3.9267578125, -3.77734375, -3.6279296875, -3.478515625, -3.3291015625, -3.1796875, -3.0302734375, -2.880859375, -2.7314453125, -2.58203125, -2.4326171875, -2.283203125, -2.1337890625, -1.984375, -1.8349609375, -1.685546875, -1.5361328125, -1.38671875, -1.2373046875, -1.087890625, -0.9384765625, -0.7890625, -0.6396484375, -0.490234375, -0.3408203125, -0.19140625, -0.0419921875, 0.107421875, 0.2568359375, 0.40625, 0.5556640625, 0.705078125, 0.8544921875, 1.00390625, 1.1533203125, 1.302734375, 1.4521484375, 1.6015625, 1.7509765625, 1.900390625, 2.0498046875, 2.19921875, 2.3486328125, 2.498046875, 2.6474609375, 2.796875, 2.9462890625, 3.095703125, 3.2451171875, 3.39453125, 3.5439453125, 3.693359375, 3.8427734375, 3.9921875, 4.1416015625, 4.291015625, 4.4404296875, 4.58984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 8.0, 14.0, 35.0, 46.0, 99.0, 204.0, 524.0, 1725.0, 9896.0, 622394.0, 401406.0, 9595.0, 1676.0, 511.0, 215.0, 84.0, 50.0, 22.0, 10.0, 10.0, 6.0, 6.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6533203125, -1.60980224609375, -1.5662841796875, -1.52276611328125, -1.479248046875, -1.43572998046875, -1.3922119140625, -1.34869384765625, -1.30517578125, -1.26165771484375, -1.2181396484375, -1.17462158203125, -1.131103515625, -1.08758544921875, -1.0440673828125, -1.00054931640625, -0.95703125, -0.91351318359375, -0.8699951171875, -0.82647705078125, -0.782958984375, -0.73944091796875, -0.6959228515625, -0.65240478515625, -0.60888671875, -0.56536865234375, -0.5218505859375, -0.47833251953125, -0.434814453125, -0.39129638671875, -0.3477783203125, -0.30426025390625, -0.2607421875, -0.21722412109375, -0.1737060546875, -0.13018798828125, -0.086669921875, -0.04315185546875, 0.0003662109375, 0.04388427734375, 0.08740234375, 0.13092041015625, 0.1744384765625, 0.21795654296875, 0.261474609375, 0.30499267578125, 0.3485107421875, 0.39202880859375, 0.435546875, 0.47906494140625, 0.5225830078125, 0.56610107421875, 0.609619140625, 0.65313720703125, 0.6966552734375, 0.74017333984375, 0.78369140625, 0.82720947265625, 0.8707275390625, 0.91424560546875, 0.957763671875, 1.00128173828125, 1.0447998046875, 1.08831787109375, 1.1318359375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 0.0, 8.0, 4.0, 6.0, 12.0, 13.0, 19.0, 31.0, 61.0, 222.0, 366.0, 133.0, 54.0, 23.0, 15.0, 9.0, 9.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0002033710479736328, -0.00019907578825950623, -0.00019478052854537964, -0.00019048526883125305, -0.00018619000911712646, -0.00018189474940299988, -0.0001775994896888733, -0.0001733042299747467, -0.00016900897026062012, -0.00016471371054649353, -0.00016041845083236694, -0.00015612319111824036, -0.00015182793140411377, -0.00014753267168998718, -0.0001432374119758606, -0.000138942152261734, -0.00013464689254760742, -0.00013035163283348083, -0.00012605637311935425, -0.00012176111340522766, -0.00011746585369110107, -0.00011317059397697449, -0.0001088753342628479, -0.00010458007454872131, -0.00010028481483459473, -9.598955512046814e-05, -9.169429540634155e-05, -8.739903569221497e-05, -8.310377597808838e-05, -7.880851626396179e-05, -7.45132565498352e-05, -7.021799683570862e-05, -6.592273712158203e-05, -6.162747740745544e-05, -5.733221769332886e-05, -5.303695797920227e-05, -4.8741698265075684e-05, -4.44464385509491e-05, -4.015117883682251e-05, -3.585591912269592e-05, -3.1560659408569336e-05, -2.726539969444275e-05, -2.2970139980316162e-05, -1.8674880266189575e-05, -1.4379620552062988e-05, -1.0084360837936401e-05, -5.7891011238098145e-06, -1.4938414096832275e-06, 2.8014183044433594e-06, 7.096678018569946e-06, 1.1391937732696533e-05, 1.568719744682312e-05, 1.9982457160949707e-05, 2.4277716875076294e-05, 2.857297658920288e-05, 3.286823630332947e-05, 3.7163496017456055e-05, 4.145875573158264e-05, 4.575401544570923e-05, 5.0049275159835815e-05, 5.43445348739624e-05, 5.863979458808899e-05, 6.293505430221558e-05, 6.723031401634216e-05, 7.152557373046875e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 3.0, 11.0, 18.0, 27.0, 38.0, 69.0, 103.0, 203.0, 465.0, 1125.0, 3539.0, 16445.0, 835455.0, 174055.0, 12382.0, 2814.0, 952.0, 408.0, 168.0, 100.0, 62.0, 30.0, 20.0, 23.0, 16.0, 4.0, 6.0, 5.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.0611114501953125, -1.016754150390625, -0.9723968505859375, -0.92803955078125, -0.8836822509765625, -0.839324951171875, -0.7949676513671875, -0.7506103515625, -0.7062530517578125, -0.661895751953125, -0.6175384521484375, -0.57318115234375, -0.5288238525390625, -0.484466552734375, -0.4401092529296875, -0.395751953125, -0.3513946533203125, -0.307037353515625, -0.2626800537109375, -0.21832275390625, -0.1739654541015625, -0.129608154296875, -0.0852508544921875, -0.0408935546875, 0.0034637451171875, 0.047821044921875, 0.0921783447265625, 0.13653564453125, 0.1808929443359375, 0.225250244140625, 0.2696075439453125, 0.31396484375, 0.3583221435546875, 0.402679443359375, 0.4470367431640625, 0.49139404296875, 0.5357513427734375, 0.580108642578125, 0.6244659423828125, 0.6688232421875, 0.7131805419921875, 0.757537841796875, 0.8018951416015625, 0.84625244140625, 0.8906097412109375, 0.934967041015625, 0.9793243408203125, 1.023681640625, 1.0680389404296875, 1.112396240234375, 1.1567535400390625, 1.20111083984375, 1.2454681396484375, 1.289825439453125, 1.3341827392578125, 1.3785400390625, 1.4228973388671875, 1.467254638671875, 1.5116119384765625, 1.55596923828125, 1.6003265380859375, 1.644683837890625, 1.6890411376953125, 1.7333984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 11.0, 9.0, 8.0, 16.0, 28.0, 38.0, 201.0, 500.0, 66.0, 38.0, 14.0, 19.0, 7.0, 11.0, 5.0, 5.0, 2.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4232063293457031, -0.40915679931640625, -0.3951072692871094, -0.3810577392578125, -0.3670082092285156, -0.35295867919921875, -0.3389091491699219, -0.324859619140625, -0.3108100891113281, -0.29676055908203125, -0.2827110290527344, -0.2686614990234375, -0.2546119689941406, -0.24056243896484375, -0.22651290893554688, -0.21246337890625, -0.19841384887695312, -0.18436431884765625, -0.17031478881835938, -0.1562652587890625, -0.14221572875976562, -0.12816619873046875, -0.11411666870117188, -0.100067138671875, -0.08601760864257812, -0.07196807861328125, -0.057918548583984375, -0.0438690185546875, -0.029819488525390625, -0.01576995849609375, -0.001720428466796875, 0.0123291015625, 0.026378631591796875, 0.04042816162109375, 0.054477691650390625, 0.0685272216796875, 0.08257675170898438, 0.09662628173828125, 0.11067581176757812, 0.124725341796875, 0.13877487182617188, 0.15282440185546875, 0.16687393188476562, 0.1809234619140625, 0.19497299194335938, 0.20902252197265625, 0.22307205200195312, 0.23712158203125, 0.2511711120605469, 0.26522064208984375, 0.2792701721191406, 0.2933197021484375, 0.3073692321777344, 0.32141876220703125, 0.3354682922363281, 0.349517822265625, 0.3635673522949219, 0.37761688232421875, 0.3916664123535156, 0.4057159423828125, 0.4197654724121094, 0.43381500244140625, 0.4478645324707031, 0.4619140625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 14.0, 14.0, 23.0, 44.0, 83.0, 139.0, 162.0, 162.0, 135.0, 96.0, 59.0, 30.0, 15.0, 12.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.257029056549072, -5.961655139923096, -5.666281700134277, -5.370907783508301, -5.075533866882324, -4.780159950256348, -4.484786510467529, -4.189412593841553, -3.8940389156341553, -3.598665237426758, -3.3032913208007812, -3.007917642593384, -2.7125439643859863, -2.4171700477600098, -2.1217963695526123, -1.8264224529266357, -1.5310487747192383, -1.2356749773025513, -0.940301239490509, -0.6449275016784668, -0.3495537042617798, -0.05417990684509277, 0.2411937713623047, 0.5365676879882812, 0.8319413661956787, 1.1273151636123657, 1.4226889610290527, 1.7180626392364502, 2.0134363174438477, 2.308810234069824, 2.6041839122772217, 2.8995578289031982, 3.1949310302734375, 3.490304708480835, 3.7856786251068115, 4.081052303314209, 4.3764262199401855, 4.671799659729004, 4.9671735763549805, 5.262547492980957, 5.557921409606934, 5.85329532623291, 6.1486687660217285, 6.444042682647705, 6.739416599273682, 7.0347900390625, 7.330163955688477, 7.625537872314453, 7.9209113121032715, 8.21628475189209, 8.511658668518066, 8.807032585144043, 9.10240650177002, 9.397780418395996, 9.693153381347656, 9.988527297973633, 10.28390121459961, 10.579275131225586, 10.874649047851562, 11.170022964477539, 11.4653959274292, 11.760769844055176, 12.056143760681152, 12.351517677307129, 12.646891593933105]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 8.0, 8.0, 7.0, 5.0, 15.0, 10.0, 15.0, 18.0, 27.0, 22.0, 22.0, 31.0, 29.0, 38.0, 38.0, 39.0, 34.0, 42.0, 52.0, 51.0, 56.0, 25.0, 39.0, 35.0, 41.0, 36.0, 25.0, 36.0, 31.0, 29.0, 21.0, 23.0, 25.0, 16.0, 15.0, 8.0, 10.0, 9.0, 4.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.087131023406982, -6.861043930053711, -6.6349568367004395, -6.408869743347168, -6.1827826499938965, -5.956695556640625, -5.7306084632873535, -5.504521369934082, -5.2784342765808105, -5.052347183227539, -4.826260089874268, -4.600172996520996, -4.374085903167725, -4.147998809814453, -3.9219117164611816, -3.69582462310791, -3.4697377681732178, -3.2436506748199463, -3.017563581466675, -2.7914764881134033, -2.565389394760132, -2.3393025398254395, -2.113215446472168, -1.887128233909607, -1.6610411405563354, -1.434954047203064, -1.2088669538497925, -0.9827799201011658, -0.7566928267478943, -0.5306057929992676, -0.3045186996459961, -0.07843160629272461, 0.14765548706054688, 0.37374258041381836, 0.5998296737670898, 0.8259167075157166, 1.0520038604736328, 1.2780908346176147, 1.5041779279708862, 1.7302650213241577, 1.9563521146774292, 2.182439088821411, 2.4085261821746826, 2.634613275527954, 2.8607003688812256, 3.086787462234497, 3.3128745555877686, 3.53896164894104, 3.7650487422943115, 3.991135835647583, 4.217222690582275, 4.443309783935547, 4.669396877288818, 4.89548397064209, 5.121571063995361, 5.347658157348633, 5.573745250701904, 5.799832344055176, 6.025919437408447, 6.252006530761719, 6.47809362411499, 6.704180717468262, 6.930267810821533, 7.156354904174805, 7.382441997528076]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 5.0, 5.0, 10.0, 12.0, 16.0, 17.0, 17.0, 36.0, 57.0, 77.0, 133.0, 220.0, 382.0, 783.0, 1745.0, 4996.0, 18268.0, 132900.0, 2518501.0, 1419959.0, 76658.0, 13009.0, 3794.0, 1329.0, 597.0, 283.0, 160.0, 110.0, 61.0, 40.0, 30.0, 19.0, 15.0, 9.0, 7.0, 9.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.56890869140625, -5.3995361328125, -5.23016357421875, -5.060791015625, -4.89141845703125, -4.7220458984375, -4.55267333984375, -4.38330078125, -4.21392822265625, -4.0445556640625, -3.87518310546875, -3.705810546875, -3.53643798828125, -3.3670654296875, -3.19769287109375, -3.0283203125, -2.85894775390625, -2.6895751953125, -2.52020263671875, -2.350830078125, -2.18145751953125, -2.0120849609375, -1.84271240234375, -1.67333984375, -1.50396728515625, -1.3345947265625, -1.16522216796875, -0.995849609375, -0.82647705078125, -0.6571044921875, -0.48773193359375, -0.318359375, -0.14898681640625, 0.0203857421875, 0.18975830078125, 0.359130859375, 0.52850341796875, 0.6978759765625, 0.86724853515625, 1.03662109375, 1.20599365234375, 1.3753662109375, 1.54473876953125, 1.714111328125, 1.88348388671875, 2.0528564453125, 2.22222900390625, 2.3916015625, 2.56097412109375, 2.7303466796875, 2.89971923828125, 3.069091796875, 3.23846435546875, 3.4078369140625, 3.57720947265625, 3.74658203125, 3.91595458984375, 4.0853271484375, 4.25469970703125, 4.424072265625, 4.59344482421875, 4.7628173828125, 4.93218994140625, 5.1015625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 5.0, 8.0, 18.0, 20.0, 28.0, 20.0, 30.0, 35.0, 42.0, 31.0, 54.0, 43.0, 32.0, 48.0, 50.0, 65.0, 53.0, 64.0, 52.0, 28.0, 41.0, 22.0, 35.0, 18.0, 38.0, 18.0, 18.0, 12.0, 11.0, 5.0, 4.0, 7.0, 5.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.31640625, -2.251708984375, -2.18701171875, -2.122314453125, -2.0576171875, -1.992919921875, -1.92822265625, -1.863525390625, -1.798828125, -1.734130859375, -1.66943359375, -1.604736328125, -1.5400390625, -1.475341796875, -1.41064453125, -1.345947265625, -1.28125, -1.216552734375, -1.15185546875, -1.087158203125, -1.0224609375, -0.957763671875, -0.89306640625, -0.828369140625, -0.763671875, -0.698974609375, -0.63427734375, -0.569580078125, -0.5048828125, -0.440185546875, -0.37548828125, -0.310791015625, -0.24609375, -0.181396484375, -0.11669921875, -0.052001953125, 0.0126953125, 0.077392578125, 0.14208984375, 0.206787109375, 0.271484375, 0.336181640625, 0.40087890625, 0.465576171875, 0.5302734375, 0.594970703125, 0.65966796875, 0.724365234375, 0.7890625, 0.853759765625, 0.91845703125, 0.983154296875, 1.0478515625, 1.112548828125, 1.17724609375, 1.241943359375, 1.306640625, 1.371337890625, 1.43603515625, 1.500732421875, 1.5654296875, 1.630126953125, 1.69482421875, 1.759521484375, 1.82421875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 13.0, 9.0, 32.0, 31.0, 60.0, 95.0, 150.0, 244.0, 520.0, 1265.0, 3054.0, 10343.0, 62622.0, 1880409.0, 2152425.0, 67496.0, 10202.0, 2958.0, 1173.0, 539.0, 244.0, 141.0, 74.0, 53.0, 31.0, 21.0, 18.0, 7.0, 8.0, 5.0, 3.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.6640625, -6.5015869140625, -6.339111328125, -6.1766357421875, -6.01416015625, -5.8516845703125, -5.689208984375, -5.5267333984375, -5.3642578125, -5.2017822265625, -5.039306640625, -4.8768310546875, -4.71435546875, -4.5518798828125, -4.389404296875, -4.2269287109375, -4.064453125, -3.9019775390625, -3.739501953125, -3.5770263671875, -3.41455078125, -3.2520751953125, -3.089599609375, -2.9271240234375, -2.7646484375, -2.6021728515625, -2.439697265625, -2.2772216796875, -2.11474609375, -1.9522705078125, -1.789794921875, -1.6273193359375, -1.46484375, -1.3023681640625, -1.139892578125, -0.9774169921875, -0.81494140625, -0.6524658203125, -0.489990234375, -0.3275146484375, -0.1650390625, -0.0025634765625, 0.159912109375, 0.3223876953125, 0.48486328125, 0.6473388671875, 0.809814453125, 0.9722900390625, 1.134765625, 1.2972412109375, 1.459716796875, 1.6221923828125, 1.78466796875, 1.9471435546875, 2.109619140625, 2.2720947265625, 2.4345703125, 2.5970458984375, 2.759521484375, 2.9219970703125, 3.08447265625, 3.2469482421875, 3.409423828125, 3.5718994140625, 3.734375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 0.0, 8.0, 8.0, 12.0, 22.0, 22.0, 40.0, 37.0, 73.0, 95.0, 160.0, 276.0, 458.0, 656.0, 746.0, 560.0, 298.0, 195.0, 115.0, 91.0, 57.0, 41.0, 31.0, 18.0, 8.0, 9.0, 4.0, 7.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.984710693359375, -0.94403076171875, -0.903350830078125, -0.8626708984375, -0.821990966796875, -0.78131103515625, -0.740631103515625, -0.699951171875, -0.659271240234375, -0.61859130859375, -0.577911376953125, -0.5372314453125, -0.496551513671875, -0.45587158203125, -0.415191650390625, -0.37451171875, -0.333831787109375, -0.29315185546875, -0.252471923828125, -0.2117919921875, -0.171112060546875, -0.13043212890625, -0.089752197265625, -0.049072265625, -0.008392333984375, 0.03228759765625, 0.072967529296875, 0.1136474609375, 0.154327392578125, 0.19500732421875, 0.235687255859375, 0.2763671875, 0.317047119140625, 0.35772705078125, 0.398406982421875, 0.4390869140625, 0.479766845703125, 0.52044677734375, 0.561126708984375, 0.601806640625, 0.642486572265625, 0.68316650390625, 0.723846435546875, 0.7645263671875, 0.805206298828125, 0.84588623046875, 0.886566162109375, 0.92724609375, 0.967926025390625, 1.00860595703125, 1.049285888671875, 1.0899658203125, 1.130645751953125, 1.17132568359375, 1.212005615234375, 1.252685546875, 1.293365478515625, 1.33404541015625, 1.374725341796875, 1.4154052734375, 1.456085205078125, 1.49676513671875, 1.537445068359375, 1.578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 23.0, 25.0, 34.0, 52.0, 64.0, 101.0, 88.0, 114.0, 110.0, 82.0, 79.0, 56.0, 48.0, 31.0, 23.0, 20.0, 14.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.406394004821777, -6.252882957458496, -6.099371433258057, -5.945860385894775, -5.792349338531494, -5.638837814331055, -5.485326766967773, -5.331815719604492, -5.178304195404053, -5.0247931480407715, -4.871281623840332, -4.717770576477051, -4.5642595291137695, -4.41074800491333, -4.257236957550049, -4.103725433349609, -3.9502146244049072, -3.796703338623047, -3.6431922912597656, -3.4896810054779053, -3.336169719696045, -3.1826586723327637, -3.0291473865509033, -2.875636100769043, -2.7221250534057617, -2.5686137676239014, -2.41510272026062, -2.2615914344787598, -2.1080801486968994, -1.9545689821243286, -1.8010578155517578, -1.6475465297698975, -1.4940354824066162, -1.3405243158340454, -1.187013030052185, -1.0335018634796143, -0.8799906373023987, -0.7264794111251831, -0.5729682445526123, -0.41945695877075195, -0.26594579219818115, -0.11243458092212677, 0.04107663035392761, 0.1945878267288208, 0.3480990529060364, 0.501610279083252, 0.6551214456558228, 0.8086327314376831, 0.9621438980102539, 1.1156550645828247, 1.269166350364685, 1.4226775169372559, 1.5761888027191162, 1.729699969291687, 1.8832111358642578, 2.036722421646118, 2.1902337074279785, 2.343744993209839, 2.49725604057312, 2.6507673263549805, 2.804278612136841, 2.957789897918701, 3.1113009452819824, 3.2648122310638428, 3.418323278427124]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 9.0, 10.0, 4.0, 8.0, 12.0, 8.0, 14.0, 11.0, 29.0, 25.0, 32.0, 34.0, 39.0, 47.0, 46.0, 55.0, 49.0, 48.0, 50.0, 50.0, 46.0, 45.0, 50.0, 42.0, 45.0, 36.0, 26.0, 27.0, 24.0, 21.0, 10.0, 10.0, 10.0, 5.0, 8.0, 1.0, 3.0, 1.0, 6.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8059191703796387, -2.7161920070648193, -2.626465082168579, -2.5367379188537598, -2.4470109939575195, -2.3572838306427, -2.267556667327881, -2.1778297424316406, -2.0881025791168213, -1.9983755350112915, -1.9086484909057617, -1.8189213275909424, -1.7291942834854126, -1.6394672393798828, -1.549740195274353, -1.4600131511688232, -1.3702861070632935, -1.2805590629577637, -1.1908320188522339, -1.101104974746704, -1.0113778114318848, -0.921650767326355, -0.8319237232208252, -0.7421966195106506, -0.6524695754051208, -0.5627425312995911, -0.4730154275894165, -0.3832883834838867, -0.29356130957603455, -0.20383423566818237, -0.11410719156265259, -0.024380087852478027, 0.06534695625305176, 0.15507403016090393, 0.2448010891675949, 0.3345281481742859, 0.42425522208213806, 0.5139822959899902, 0.60370934009552, 0.6934364438056946, 0.7831634879112244, 0.8728905320167542, 0.9626176357269287, 1.0523446798324585, 1.1420717239379883, 1.2317988872528076, 1.3215258121490479, 1.4112529754638672, 1.500980019569397, 1.5907070636749268, 1.6804341077804565, 1.7701611518859863, 1.8598883152008057, 1.9496153593063354, 2.0393424034118652, 2.1290695667266846, 2.218796491622925, 2.308523654937744, 2.3982505798339844, 2.4879777431488037, 2.577704668045044, 2.6674318313598633, 2.7571587562561035, 2.846885919570923, 2.936613082885742]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 11.0, 13.0, 23.0, 34.0, 52.0, 79.0, 110.0, 179.0, 288.0, 534.0, 953.0, 1874.0, 3938.0, 9831.0, 27823.0, 108358.0, 558331.0, 256895.0, 51674.0, 15742.0, 6046.0, 2621.0, 1342.0, 708.0, 431.0, 231.0, 143.0, 82.0, 69.0, 37.0, 32.0, 23.0, 9.0, 4.0, 11.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.56689453125, -0.5478363037109375, -0.528778076171875, -0.5097198486328125, -0.49066162109375, -0.4716033935546875, -0.452545166015625, -0.4334869384765625, -0.4144287109375, -0.3953704833984375, -0.376312255859375, -0.3572540283203125, -0.33819580078125, -0.3191375732421875, -0.300079345703125, -0.2810211181640625, -0.261962890625, -0.2429046630859375, -0.223846435546875, -0.2047882080078125, -0.18572998046875, -0.1666717529296875, -0.147613525390625, -0.1285552978515625, -0.1094970703125, -0.0904388427734375, -0.071380615234375, -0.0523223876953125, -0.03326416015625, -0.0142059326171875, 0.004852294921875, 0.0239105224609375, 0.04296875, 0.0620269775390625, 0.081085205078125, 0.1001434326171875, 0.11920166015625, 0.1382598876953125, 0.157318115234375, 0.1763763427734375, 0.1954345703125, 0.2144927978515625, 0.233551025390625, 0.2526092529296875, 0.27166748046875, 0.2907257080078125, 0.309783935546875, 0.3288421630859375, 0.347900390625, 0.3669586181640625, 0.386016845703125, 0.4050750732421875, 0.42413330078125, 0.4431915283203125, 0.462249755859375, 0.4813079833984375, 0.5003662109375, 0.5194244384765625, 0.538482666015625, 0.5575408935546875, 0.57659912109375, 0.5956573486328125, 0.614715576171875, 0.6337738037109375, 0.65283203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 7.0, 13.0, 9.0, 15.0, 22.0, 23.0, 39.0, 41.0, 39.0, 71.0, 70.0, 71.0, 72.0, 78.0, 56.0, 69.0, 61.0, 64.0, 49.0, 32.0, 27.0, 31.0, 12.0, 7.0, 2.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193359375, -2.11181640625, -2.0302734375, -1.94873046875, -1.8671875, -1.78564453125, -1.7041015625, -1.62255859375, -1.541015625, -1.45947265625, -1.3779296875, -1.29638671875, -1.21484375, -1.13330078125, -1.0517578125, -0.97021484375, -0.888671875, -0.80712890625, -0.7255859375, -0.64404296875, -0.5625, -0.48095703125, -0.3994140625, -0.31787109375, -0.236328125, -0.15478515625, -0.0732421875, 0.00830078125, 0.08984375, 0.17138671875, 0.2529296875, 0.33447265625, 0.416015625, 0.49755859375, 0.5791015625, 0.66064453125, 0.7421875, 0.82373046875, 0.9052734375, 0.98681640625, 1.068359375, 1.14990234375, 1.2314453125, 1.31298828125, 1.39453125, 1.47607421875, 1.5576171875, 1.63916015625, 1.720703125, 1.80224609375, 1.8837890625, 1.96533203125, 2.046875, 2.12841796875, 2.2099609375, 2.29150390625, 2.373046875, 2.45458984375, 2.5361328125, 2.61767578125, 2.69921875, 2.78076171875, 2.8623046875, 2.94384765625, 3.025390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 8.0, 18.0, 24.0, 32.0, 62.0, 94.0, 114.0, 209.0, 303.0, 502.0, 803.0, 1412.0, 2597.0, 4914.0, 9577.0, 19225.0, 42599.0, 104091.0, 295398.0, 347028.0, 125189.0, 49455.0, 21983.0, 10636.0, 5319.0, 2884.0, 1597.0, 930.0, 572.0, 329.0, 204.0, 142.0, 102.0, 61.0, 33.0, 34.0, 28.0, 10.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.256591796875, -0.24906539916992188, -0.24153900146484375, -0.23401260375976562, -0.2264862060546875, -0.21895980834960938, -0.21143341064453125, -0.20390701293945312, -0.196380615234375, -0.18885421752929688, -0.18132781982421875, -0.17380142211914062, -0.1662750244140625, -0.15874862670898438, -0.15122222900390625, -0.14369583129882812, -0.13616943359375, -0.12864303588867188, -0.12111663818359375, -0.11359024047851562, -0.1060638427734375, -0.09853744506835938, -0.09101104736328125, -0.08348464965820312, -0.075958251953125, -0.06843185424804688, -0.06090545654296875, -0.053379058837890625, -0.0458526611328125, -0.038326263427734375, -0.03079986572265625, -0.023273468017578125, -0.0157470703125, -0.008220672607421875, -0.00069427490234375, 0.006832122802734375, 0.0143585205078125, 0.021884918212890625, 0.02941131591796875, 0.036937713623046875, 0.044464111328125, 0.051990509033203125, 0.05951690673828125, 0.06704330444335938, 0.0745697021484375, 0.08209609985351562, 0.08962249755859375, 0.09714889526367188, 0.10467529296875, 0.11220169067382812, 0.11972808837890625, 0.12725448608398438, 0.1347808837890625, 0.14230728149414062, 0.14983367919921875, 0.15736007690429688, 0.164886474609375, 0.17241287231445312, 0.17993927001953125, 0.18746566772460938, 0.1949920654296875, 0.20251846313476562, 0.21004486083984375, 0.21757125854492188, 0.22509765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 7.0, 7.0, 11.0, 9.0, 19.0, 23.0, 17.0, 28.0, 34.0, 37.0, 33.0, 37.0, 45.0, 37.0, 46.0, 62.0, 43.0, 50.0, 42.0, 46.0, 42.0, 41.0, 38.0, 29.0, 31.0, 30.0, 26.0, 19.0, 25.0, 13.0, 10.0, 13.0, 11.0, 9.0, 1.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.84765625, -3.739593505859375, -3.63153076171875, -3.523468017578125, -3.4154052734375, -3.307342529296875, -3.19927978515625, -3.091217041015625, -2.983154296875, -2.875091552734375, -2.76702880859375, -2.658966064453125, -2.5509033203125, -2.442840576171875, -2.33477783203125, -2.226715087890625, -2.11865234375, -2.010589599609375, -1.90252685546875, -1.794464111328125, -1.6864013671875, -1.578338623046875, -1.47027587890625, -1.362213134765625, -1.254150390625, -1.146087646484375, -1.03802490234375, -0.929962158203125, -0.8218994140625, -0.713836669921875, -0.60577392578125, -0.497711181640625, -0.3896484375, -0.281585693359375, -0.17352294921875, -0.065460205078125, 0.0426025390625, 0.150665283203125, 0.25872802734375, 0.366790771484375, 0.474853515625, 0.582916259765625, 0.69097900390625, 0.799041748046875, 0.9071044921875, 1.015167236328125, 1.12322998046875, 1.231292724609375, 1.33935546875, 1.447418212890625, 1.55548095703125, 1.663543701171875, 1.7716064453125, 1.879669189453125, 1.98773193359375, 2.095794677734375, 2.203857421875, 2.311920166015625, 2.41998291015625, 2.528045654296875, 2.6361083984375, 2.744171142578125, 2.85223388671875, 2.960296630859375, 3.068359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 10.0, 16.0, 28.0, 38.0, 73.0, 123.0, 249.0, 543.0, 1731.0, 7492.0, 59350.0, 822992.0, 138829.0, 12880.0, 2544.0, 759.0, 353.0, 200.0, 101.0, 74.0, 54.0, 33.0, 23.0, 15.0, 13.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09820556640625, -0.0951986312866211, -0.09219169616699219, -0.08918476104736328, -0.08617782592773438, -0.08317089080810547, -0.08016395568847656, -0.07715702056884766, -0.07415008544921875, -0.07114315032958984, -0.06813621520996094, -0.06512928009033203, -0.062122344970703125, -0.05911540985107422, -0.05610847473144531, -0.053101539611816406, -0.0500946044921875, -0.047087669372558594, -0.04408073425292969, -0.04107379913330078, -0.038066864013671875, -0.03505992889404297, -0.03205299377441406, -0.029046058654785156, -0.02603912353515625, -0.023032188415527344, -0.020025253295898438, -0.01701831817626953, -0.014011383056640625, -0.011004447937011719, -0.007997512817382812, -0.004990577697753906, -0.001983642578125, 0.0010232925415039062, 0.0040302276611328125, 0.007037162780761719, 0.010044097900390625, 0.013051033020019531, 0.016057968139648438, 0.019064903259277344, 0.02207183837890625, 0.025078773498535156, 0.028085708618164062, 0.03109264373779297, 0.034099578857421875, 0.03710651397705078, 0.04011344909667969, 0.043120384216308594, 0.0461273193359375, 0.049134254455566406, 0.05214118957519531, 0.05514812469482422, 0.058155059814453125, 0.06116199493408203, 0.06416893005371094, 0.06717586517333984, 0.07018280029296875, 0.07318973541259766, 0.07619667053222656, 0.07920360565185547, 0.08221054077148438, 0.08521747589111328, 0.08822441101074219, 0.0912313461303711, 0.09423828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 6.0, 10.0, 4.0, 8.0, 10.0, 14.0, 15.0, 16.0, 31.0, 23.0, 53.0, 59.0, 73.0, 72.0, 71.0, 77.0, 83.0, 77.0, 69.0, 51.0, 40.0, 31.0, 24.0, 16.0, 17.0, 11.0, 9.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.427267074584961e-05, -3.3280812203884125e-05, -3.228895366191864e-05, -3.1297095119953156e-05, -3.030523657798767e-05, -2.9313378036022186e-05, -2.83215194940567e-05, -2.7329660952091217e-05, -2.6337802410125732e-05, -2.5345943868160248e-05, -2.4354085326194763e-05, -2.336222678422928e-05, -2.2370368242263794e-05, -2.137850970029831e-05, -2.0386651158332825e-05, -1.939479261636734e-05, -1.8402934074401855e-05, -1.741107553243637e-05, -1.6419216990470886e-05, -1.54273584485054e-05, -1.4435499906539917e-05, -1.3443641364574432e-05, -1.2451782822608948e-05, -1.1459924280643463e-05, -1.0468065738677979e-05, -9.476207196712494e-06, -8.48434865474701e-06, -7.492490112781525e-06, -6.50063157081604e-06, -5.508773028850555e-06, -4.516914486885071e-06, -3.525055944919586e-06, -2.5331974029541016e-06, -1.541338860988617e-06, -5.494803190231323e-07, 4.423782229423523e-07, 1.434236764907837e-06, 2.4260953068733215e-06, 3.417953848838806e-06, 4.409812390804291e-06, 5.401670932769775e-06, 6.39352947473526e-06, 7.385388016700745e-06, 8.37724655866623e-06, 9.369105100631714e-06, 1.0360963642597198e-05, 1.1352822184562683e-05, 1.2344680726528168e-05, 1.3336539268493652e-05, 1.4328397810459137e-05, 1.532025635242462e-05, 1.6312114894390106e-05, 1.730397343635559e-05, 1.8295831978321075e-05, 1.928769052028656e-05, 2.0279549062252045e-05, 2.127140760421753e-05, 2.2263266146183014e-05, 2.32551246881485e-05, 2.4246983230113983e-05, 2.5238841772079468e-05, 2.6230700314044952e-05, 2.7222558856010437e-05, 2.821441739797592e-05, 2.9206275939941406e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 18.0, 28.0, 33.0, 65.0, 103.0, 179.0, 299.0, 537.0, 1003.0, 2011.0, 4484.0, 10948.0, 31940.0, 132031.0, 666222.0, 144158.0, 34166.0, 11208.0, 4545.0, 2049.0, 1091.0, 587.0, 314.0, 163.0, 109.0, 70.0, 48.0, 31.0, 24.0, 11.0, 15.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.057373046875, -0.05549335479736328, -0.05361366271972656, -0.051733970642089844, -0.049854278564453125, -0.047974586486816406, -0.04609489440917969, -0.04421520233154297, -0.04233551025390625, -0.04045581817626953, -0.03857612609863281, -0.036696434020996094, -0.034816741943359375, -0.032937049865722656, -0.031057357788085938, -0.02917766571044922, -0.0272979736328125, -0.02541828155517578, -0.023538589477539062, -0.021658897399902344, -0.019779205322265625, -0.017899513244628906, -0.016019821166992188, -0.014140129089355469, -0.01226043701171875, -0.010380744934082031, -0.008501052856445312, -0.006621360778808594, -0.004741668701171875, -0.0028619766235351562, -0.0009822845458984375, 0.0008974075317382812, 0.002777099609375, 0.004656791687011719, 0.0065364837646484375, 0.008416175842285156, 0.010295867919921875, 0.012175559997558594, 0.014055252075195312, 0.01593494415283203, 0.01781463623046875, 0.01969432830810547, 0.021574020385742188, 0.023453712463378906, 0.025333404541015625, 0.027213096618652344, 0.029092788696289062, 0.03097248077392578, 0.0328521728515625, 0.03473186492919922, 0.03661155700683594, 0.038491249084472656, 0.040370941162109375, 0.042250633239746094, 0.04413032531738281, 0.04601001739501953, 0.04788970947265625, 0.04976940155029297, 0.05164909362792969, 0.053528785705566406, 0.055408477783203125, 0.057288169860839844, 0.05916786193847656, 0.06104755401611328, 0.06292724609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 5.0, 15.0, 11.0, 9.0, 12.0, 10.0, 12.0, 16.0, 29.0, 39.0, 49.0, 55.0, 87.0, 171.0, 140.0, 94.0, 70.0, 48.0, 22.0, 23.0, 18.0, 17.0, 14.0, 8.0, 8.0, 2.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01386260986328125, -0.013383030891418457, -0.012903451919555664, -0.012423872947692871, -0.011944293975830078, -0.011464715003967285, -0.010985136032104492, -0.0105055570602417, -0.010025978088378906, -0.009546399116516113, -0.00906682014465332, -0.008587241172790527, -0.008107662200927734, -0.007628083229064941, -0.0071485042572021484, -0.0066689252853393555, -0.0061893463134765625, -0.0057097673416137695, -0.0052301883697509766, -0.004750609397888184, -0.004271030426025391, -0.0037914514541625977, -0.0033118724822998047, -0.0028322935104370117, -0.0023527145385742188, -0.0018731355667114258, -0.0013935565948486328, -0.0009139776229858398, -0.0004343986511230469, 4.5180320739746094e-05, 0.0005247592926025391, 0.001004338264465332, 0.001483917236328125, 0.001963496208190918, 0.002443075180053711, 0.002922654151916504, 0.003402233123779297, 0.00388181209564209, 0.004361391067504883, 0.004840970039367676, 0.005320549011230469, 0.005800127983093262, 0.006279706954956055, 0.006759285926818848, 0.007238864898681641, 0.007718443870544434, 0.008198022842407227, 0.00867760181427002, 0.009157180786132812, 0.009636759757995605, 0.010116338729858398, 0.010595917701721191, 0.011075496673583984, 0.011555075645446777, 0.01203465461730957, 0.012514233589172363, 0.012993812561035156, 0.01347339153289795, 0.013952970504760742, 0.014432549476623535, 0.014912128448486328, 0.015391707420349121, 0.015871286392211914, 0.016350865364074707, 0.0168304443359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 10.0, 15.0, 39.0, 46.0, 77.0, 124.0, 151.0, 132.0, 133.0, 100.0, 63.0, 51.0, 24.0, 20.0, 10.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.755821228027344, -4.631500720977783, -4.507180213928223, -4.382859706878662, -4.258539199829102, -4.134218692779541, -4.0098981857299805, -3.88557767868042, -3.7612571716308594, -3.636936664581299, -3.5126161575317383, -3.3882956504821777, -3.263975143432617, -3.1396546363830566, -3.015334129333496, -2.8910136222839355, -2.766693115234375, -2.6423726081848145, -2.518052101135254, -2.3937315940856934, -2.269411087036133, -2.1450905799865723, -2.0207700729370117, -1.8964495658874512, -1.7721290588378906, -1.64780855178833, -1.5234880447387695, -1.399167537689209, -1.2748470306396484, -1.150526523590088, -1.0262060165405273, -0.9018855094909668, -0.7775650024414062, -0.6532444953918457, -0.5289239883422852, -0.4046034812927246, -0.28028297424316406, -0.15596246719360352, -0.03164196014404297, 0.09267854690551758, 0.21699905395507812, 0.34131956100463867, 0.4656400680541992, 0.5899605751037598, 0.7142810821533203, 0.8386015892028809, 0.9629220962524414, 1.087242603302002, 1.2115631103515625, 1.335883617401123, 1.4602041244506836, 1.5845246315002441, 1.7088451385498047, 1.8331656455993652, 1.9574861526489258, 2.0818066596984863, 2.206127166748047, 2.3304476737976074, 2.454768180847168, 2.5790886878967285, 2.703409194946289, 2.8277297019958496, 2.95205020904541, 3.0763707160949707, 3.2006912231445312]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 11.0, 9.0, 14.0, 14.0, 14.0, 29.0, 38.0, 43.0, 42.0, 68.0, 65.0, 81.0, 68.0, 66.0, 70.0, 64.0, 61.0, 62.0, 44.0, 37.0, 30.0, 23.0, 12.0, 9.0, 7.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9833922386169434, -1.9069877862930298, -1.8305833339691162, -1.7541788816452026, -1.677774429321289, -1.6013699769973755, -1.524965524673462, -1.4485610723495483, -1.3721566200256348, -1.2957521677017212, -1.2193477153778076, -1.142943263053894, -1.0665388107299805, -0.9901343584060669, -0.9137299060821533, -0.8373254537582397, -0.7609210014343262, -0.6845165491104126, -0.608112096786499, -0.5317076444625854, -0.4553031921386719, -0.3788987398147583, -0.3024942874908447, -0.22608983516693115, -0.14968538284301758, -0.073280930519104, 0.0031235218048095703, 0.07952797412872314, 0.15593242645263672, 0.2323368787765503, 0.30874133110046387, 0.38514578342437744, 0.461550235748291, 0.5379546880722046, 0.6143591403961182, 0.6907635927200317, 0.7671680450439453, 0.8435724973678589, 0.9199769496917725, 0.996381402015686, 1.0727858543395996, 1.1491903066635132, 1.2255947589874268, 1.3019992113113403, 1.378403663635254, 1.4548081159591675, 1.531212568283081, 1.6076170206069946, 1.6840214729309082, 1.7604259252548218, 1.8368303775787354, 1.913234829902649, 1.9896392822265625, 2.0660438537597656, 2.1424481868743896, 2.2188525199890137, 2.295257091522217, 2.37166166305542, 2.448065996170044, 2.524470329284668, 2.600874900817871, 2.677279472351074, 2.7536838054656982, 2.8300881385803223, 2.9064927101135254]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 11.0, 18.0, 29.0, 45.0, 58.0, 96.0, 145.0, 288.0, 551.0, 1136.0, 2412.0, 5392.0, 12855.0, 35771.0, 178495.0, 675172.0, 93283.0, 25125.0, 9726.0, 4208.0, 1764.0, 903.0, 450.0, 245.0, 142.0, 83.0, 39.0, 37.0, 26.0, 13.0, 13.0, 5.0, 8.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.087890625, -2.019073486328125, -1.95025634765625, -1.881439208984375, -1.8126220703125, -1.743804931640625, -1.67498779296875, -1.606170654296875, -1.537353515625, -1.468536376953125, -1.39971923828125, -1.330902099609375, -1.2620849609375, -1.193267822265625, -1.12445068359375, -1.055633544921875, -0.98681640625, -0.917999267578125, -0.84918212890625, -0.780364990234375, -0.7115478515625, -0.642730712890625, -0.57391357421875, -0.505096435546875, -0.436279296875, -0.367462158203125, -0.29864501953125, -0.229827880859375, -0.1610107421875, -0.092193603515625, -0.02337646484375, 0.045440673828125, 0.1142578125, 0.183074951171875, 0.25189208984375, 0.320709228515625, 0.3895263671875, 0.458343505859375, 0.52716064453125, 0.595977783203125, 0.664794921875, 0.733612060546875, 0.80242919921875, 0.871246337890625, 0.9400634765625, 1.008880615234375, 1.07769775390625, 1.146514892578125, 1.21533203125, 1.284149169921875, 1.35296630859375, 1.421783447265625, 1.4906005859375, 1.559417724609375, 1.62823486328125, 1.697052001953125, 1.765869140625, 1.834686279296875, 1.90350341796875, 1.972320556640625, 2.0411376953125, 2.109954833984375, 2.17877197265625, 2.247589111328125, 2.31640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 6.0, 10.0, 6.0, 14.0, 15.0, 18.0, 20.0, 28.0, 25.0, 45.0, 38.0, 34.0, 55.0, 39.0, 54.0, 49.0, 48.0, 44.0, 44.0, 46.0, 52.0, 39.0, 49.0, 29.0, 34.0, 28.0, 26.0, 17.0, 15.0, 10.0, 11.0, 7.0, 2.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.3209228515625, -3.218017578125, -3.1151123046875, -3.01220703125, -2.9093017578125, -2.806396484375, -2.7034912109375, -2.6005859375, -2.4976806640625, -2.394775390625, -2.2918701171875, -2.18896484375, -2.0860595703125, -1.983154296875, -1.8802490234375, -1.77734375, -1.6744384765625, -1.571533203125, -1.4686279296875, -1.36572265625, -1.2628173828125, -1.159912109375, -1.0570068359375, -0.9541015625, -0.8511962890625, -0.748291015625, -0.6453857421875, -0.54248046875, -0.4395751953125, -0.336669921875, -0.2337646484375, -0.130859375, -0.0279541015625, 0.074951171875, 0.1778564453125, 0.28076171875, 0.3836669921875, 0.486572265625, 0.5894775390625, 0.6923828125, 0.7952880859375, 0.898193359375, 1.0010986328125, 1.10400390625, 1.2069091796875, 1.309814453125, 1.4127197265625, 1.515625, 1.6185302734375, 1.721435546875, 1.8243408203125, 1.92724609375, 2.0301513671875, 2.133056640625, 2.2359619140625, 2.3388671875, 2.4417724609375, 2.544677734375, 2.6475830078125, 2.75048828125, 2.8533935546875, 2.956298828125, 3.0592041015625, 3.162109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 4.0, 7.0, 11.0, 18.0, 9.0, 12.0, 13.0, 35.0, 39.0, 56.0, 79.0, 112.0, 205.0, 402.0, 1117.0, 5549.0, 49055.0, 934554.0, 49502.0, 5547.0, 1143.0, 426.0, 202.0, 115.0, 74.0, 46.0, 49.0, 30.0, 30.0, 18.0, 20.0, 15.0, 4.0, 7.0, 10.0, 7.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.391357421875, -5.22021484375, -5.049072265625, -4.8779296875, -4.706787109375, -4.53564453125, -4.364501953125, -4.193359375, -4.022216796875, -3.85107421875, -3.679931640625, -3.5087890625, -3.337646484375, -3.16650390625, -2.995361328125, -2.82421875, -2.653076171875, -2.48193359375, -2.310791015625, -2.1396484375, -1.968505859375, -1.79736328125, -1.626220703125, -1.455078125, -1.283935546875, -1.11279296875, -0.941650390625, -0.7705078125, -0.599365234375, -0.42822265625, -0.257080078125, -0.0859375, 0.085205078125, 0.25634765625, 0.427490234375, 0.5986328125, 0.769775390625, 0.94091796875, 1.112060546875, 1.283203125, 1.454345703125, 1.62548828125, 1.796630859375, 1.9677734375, 2.138916015625, 2.31005859375, 2.481201171875, 2.65234375, 2.823486328125, 2.99462890625, 3.165771484375, 3.3369140625, 3.508056640625, 3.67919921875, 3.850341796875, 4.021484375, 4.192626953125, 4.36376953125, 4.534912109375, 4.7060546875, 4.877197265625, 5.04833984375, 5.219482421875, 5.390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 4.0, 13.0, 6.0, 9.0, 21.0, 14.0, 16.0, 19.0, 24.0, 32.0, 20.0, 43.0, 50.0, 56.0, 48.0, 53.0, 55.0, 62.0, 50.0, 48.0, 46.0, 39.0, 33.0, 30.0, 32.0, 33.0, 28.0, 26.0, 17.0, 16.0, 5.0, 9.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65625, -3.52862548828125, -3.4010009765625, -3.27337646484375, -3.145751953125, -3.01812744140625, -2.8905029296875, -2.76287841796875, -2.63525390625, -2.50762939453125, -2.3800048828125, -2.25238037109375, -2.124755859375, -1.99713134765625, -1.8695068359375, -1.74188232421875, -1.6142578125, -1.48663330078125, -1.3590087890625, -1.23138427734375, -1.103759765625, -0.97613525390625, -0.8485107421875, -0.72088623046875, -0.59326171875, -0.46563720703125, -0.3380126953125, -0.21038818359375, -0.082763671875, 0.04486083984375, 0.1724853515625, 0.30010986328125, 0.427734375, 0.55535888671875, 0.6829833984375, 0.81060791015625, 0.938232421875, 1.06585693359375, 1.1934814453125, 1.32110595703125, 1.44873046875, 1.57635498046875, 1.7039794921875, 1.83160400390625, 1.959228515625, 2.08685302734375, 2.2144775390625, 2.34210205078125, 2.4697265625, 2.59735107421875, 2.7249755859375, 2.85260009765625, 2.980224609375, 3.10784912109375, 3.2354736328125, 3.36309814453125, 3.49072265625, 3.61834716796875, 3.7459716796875, 3.87359619140625, 4.001220703125, 4.12884521484375, 4.2564697265625, 4.38409423828125, 4.51171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 7.0, 7.0, 16.0, 19.0, 39.0, 67.0, 130.0, 244.0, 538.0, 1361.0, 4935.0, 23298.0, 369509.0, 615815.0, 24926.0, 5115.0, 1435.0, 518.0, 246.0, 135.0, 70.0, 40.0, 22.0, 21.0, 9.0, 1.0, 3.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.21875, -1.1866912841796875, -1.154632568359375, -1.1225738525390625, -1.09051513671875, -1.0584564208984375, -1.026397705078125, -0.9943389892578125, -0.9622802734375, -0.9302215576171875, -0.898162841796875, -0.8661041259765625, -0.83404541015625, -0.8019866943359375, -0.769927978515625, -0.7378692626953125, -0.705810546875, -0.6737518310546875, -0.641693115234375, -0.6096343994140625, -0.57757568359375, -0.5455169677734375, -0.513458251953125, -0.4813995361328125, -0.4493408203125, -0.4172821044921875, -0.385223388671875, -0.3531646728515625, -0.32110595703125, -0.2890472412109375, -0.256988525390625, -0.2249298095703125, -0.19287109375, -0.1608123779296875, -0.128753662109375, -0.0966949462890625, -0.06463623046875, -0.0325775146484375, -0.000518798828125, 0.0315399169921875, 0.0635986328125, 0.0956573486328125, 0.127716064453125, 0.1597747802734375, 0.19183349609375, 0.2238922119140625, 0.255950927734375, 0.2880096435546875, 0.320068359375, 0.3521270751953125, 0.384185791015625, 0.4162445068359375, 0.44830322265625, 0.4803619384765625, 0.512420654296875, 0.5444793701171875, 0.5765380859375, 0.6085968017578125, 0.640655517578125, 0.6727142333984375, 0.70477294921875, 0.7368316650390625, 0.768890380859375, 0.8009490966796875, 0.8330078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 9.0, 4.0, 11.0, 14.0, 21.0, 33.0, 74.0, 112.0, 315.0, 202.0, 73.0, 42.0, 21.0, 16.0, 23.0, 4.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010716915130615234, -0.00010283850133419037, -9.85078513622284e-05, -9.417720139026642e-05, -8.984655141830444e-05, -8.551590144634247e-05, -8.118525147438049e-05, -7.685460150241852e-05, -7.252395153045654e-05, -6.819330155849457e-05, -6.386265158653259e-05, -5.953200161457062e-05, -5.520135164260864e-05, -5.087070167064667e-05, -4.654005169868469e-05, -4.220940172672272e-05, -3.787875175476074e-05, -3.354810178279877e-05, -2.9217451810836792e-05, -2.4886801838874817e-05, -2.0556151866912842e-05, -1.6225501894950867e-05, -1.1894851922988892e-05, -7.5642019510269165e-06, -3.2335519790649414e-06, 1.0970979928970337e-06, 5.427747964859009e-06, 9.758397936820984e-06, 1.4089047908782959e-05, 1.8419697880744934e-05, 2.275034785270691e-05, 2.7080997824668884e-05, 3.141164779663086e-05, 3.5742297768592834e-05, 4.007294774055481e-05, 4.4403597712516785e-05, 4.873424768447876e-05, 5.3064897656440735e-05, 5.739554762840271e-05, 6.172619760036469e-05, 6.605684757232666e-05, 7.038749754428864e-05, 7.471814751625061e-05, 7.904879748821259e-05, 8.337944746017456e-05, 8.771009743213654e-05, 9.204074740409851e-05, 9.637139737606049e-05, 0.00010070204734802246, 0.00010503269731998444, 0.00010936334729194641, 0.00011369399726390839, 0.00011802464723587036, 0.00012235529720783234, 0.0001266859471797943, 0.0001310165971517563, 0.00013534724712371826, 0.00013967789709568024, 0.0001440085470676422, 0.0001483391970396042, 0.00015266984701156616, 0.00015700049698352814, 0.0001613311469554901, 0.0001656617969274521, 0.00016999244689941406]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 11.0, 16.0, 34.0, 76.0, 94.0, 217.0, 368.0, 734.0, 1895.0, 6278.0, 42233.0, 898380.0, 83969.0, 9844.0, 2474.0, 936.0, 411.0, 245.0, 135.0, 71.0, 50.0, 30.0, 13.0, 11.0, 8.0, 4.0, 4.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3095703125, -1.269439697265625, -1.22930908203125, -1.189178466796875, -1.1490478515625, -1.108917236328125, -1.06878662109375, -1.028656005859375, -0.988525390625, -0.948394775390625, -0.90826416015625, -0.868133544921875, -0.8280029296875, -0.787872314453125, -0.74774169921875, -0.707611083984375, -0.66748046875, -0.627349853515625, -0.58721923828125, -0.547088623046875, -0.5069580078125, -0.466827392578125, -0.42669677734375, -0.386566162109375, -0.346435546875, -0.306304931640625, -0.26617431640625, -0.226043701171875, -0.1859130859375, -0.145782470703125, -0.10565185546875, -0.065521240234375, -0.025390625, 0.014739990234375, 0.05487060546875, 0.095001220703125, 0.1351318359375, 0.175262451171875, 0.21539306640625, 0.255523681640625, 0.295654296875, 0.335784912109375, 0.37591552734375, 0.416046142578125, 0.4561767578125, 0.496307373046875, 0.53643798828125, 0.576568603515625, 0.61669921875, 0.656829833984375, 0.69696044921875, 0.737091064453125, 0.7772216796875, 0.817352294921875, 0.85748291015625, 0.897613525390625, 0.937744140625, 0.977874755859375, 1.01800537109375, 1.058135986328125, 1.0982666015625, 1.138397216796875, 1.17852783203125, 1.218658447265625, 1.2587890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 7.0, 15.0, 16.0, 31.0, 39.0, 55.0, 147.0, 428.0, 72.0, 60.0, 25.0, 28.0, 12.0, 8.0, 9.0, 10.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38330078125, -0.3686981201171875, -0.354095458984375, -0.3394927978515625, -0.32489013671875, -0.3102874755859375, -0.295684814453125, -0.2810821533203125, -0.2664794921875, -0.2518768310546875, -0.237274169921875, -0.2226715087890625, -0.20806884765625, -0.1934661865234375, -0.178863525390625, -0.1642608642578125, -0.149658203125, -0.1350555419921875, -0.120452880859375, -0.1058502197265625, -0.09124755859375, -0.0766448974609375, -0.062042236328125, -0.0474395751953125, -0.0328369140625, -0.0182342529296875, -0.003631591796875, 0.0109710693359375, 0.02557373046875, 0.0401763916015625, 0.054779052734375, 0.0693817138671875, 0.083984375, 0.0985870361328125, 0.113189697265625, 0.1277923583984375, 0.14239501953125, 0.1569976806640625, 0.171600341796875, 0.1862030029296875, 0.2008056640625, 0.2154083251953125, 0.230010986328125, 0.2446136474609375, 0.25921630859375, 0.2738189697265625, 0.288421630859375, 0.3030242919921875, 0.317626953125, 0.3322296142578125, 0.346832275390625, 0.3614349365234375, 0.37603759765625, 0.3906402587890625, 0.405242919921875, 0.4198455810546875, 0.4344482421875, 0.4490509033203125, 0.463653564453125, 0.4782562255859375, 0.49285888671875, 0.5074615478515625, 0.522064208984375, 0.5366668701171875, 0.55126953125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 23.0, 163.0, 474.0, 269.0, 69.0, 9.0, 3.0], "bins": [-51.87593460083008, -51.006404876708984, -50.13687515258789, -49.26734161376953, -48.39781188964844, -47.528282165527344, -46.65875244140625, -45.789222717285156, -44.91969299316406, -44.05016326904297, -43.180633544921875, -42.311100006103516, -41.44157028198242, -40.57204055786133, -39.702510833740234, -38.83298110961914, -37.96344757080078, -37.09391784667969, -36.224388122558594, -35.354854583740234, -34.48532485961914, -33.61579513549805, -32.74626541137695, -31.87673568725586, -31.007204055786133, -30.13767433166504, -29.268142700195312, -28.39861297607422, -27.529083251953125, -26.6595516204834, -25.790021896362305, -24.920490264892578, -24.050960540771484, -23.18143081665039, -22.311899185180664, -21.44236946105957, -20.572837829589844, -19.70330810546875, -18.833778381347656, -17.964248657226562, -17.094717025756836, -16.225187301635742, -15.355655670166016, -14.486125946044922, -13.616595268249512, -12.747064590454102, -11.877534866333008, -11.008004188537598, -10.138473510742188, -9.268942832946777, -8.399412155151367, -7.529882431030273, -6.660351753234863, -5.790821075439453, -4.921290874481201, -4.051760673522949, -3.1822304725646973, -2.312700033187866, -1.4431695938110352, -0.5736391544342041, 0.29589128494262695, 1.165421962738037, 2.034952163696289, 2.904482364654541, 3.774013042449951]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 10.0, 4.0, 13.0, 10.0, 15.0, 14.0, 20.0, 14.0, 30.0, 23.0, 25.0, 22.0, 32.0, 34.0, 37.0, 45.0, 42.0, 33.0, 55.0, 53.0, 42.0, 47.0, 50.0, 42.0, 36.0, 36.0, 33.0, 36.0, 26.0, 20.0, 14.0, 21.0, 13.0, 9.0, 12.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.7066826820373535, -6.516510486602783, -6.326337814331055, -6.136165618896484, -5.945992946624756, -5.7558207511901855, -5.565648078918457, -5.375475883483887, -5.185303688049316, -4.995131492614746, -4.804958820343018, -4.614786624908447, -4.424613952636719, -4.234441757202148, -4.044269561767578, -3.8540968894958496, -3.6639244556427, -3.473752021789551, -3.2835795879364014, -3.093407154083252, -2.9032349586486816, -2.7130625247955322, -2.522890090942383, -2.3327178955078125, -2.142545223236084, -1.9523727893829346, -1.7622004747390747, -1.5720280408859253, -1.3818557262420654, -1.191683292388916, -1.0015108585357666, -0.8113385438919067, -0.6211662292480469, -0.43099385499954224, -0.2408214509487152, -0.050649046897888184, 0.13952332735061646, 0.3296957015991211, 0.5198681354522705, 0.7100404500961304, 0.9002128839492798, 1.0903853178024292, 1.280557632446289, 1.4707300662994385, 1.660902500152588, 1.8510748147964478, 2.0412473678588867, 2.231419563293457, 2.4215919971466064, 2.611764430999756, 2.8019368648529053, 2.9921092987060547, 3.182281494140625, 3.3724539279937744, 3.562626361846924, 3.752798557281494, 3.9429712295532227, 4.133143424987793, 4.3233160972595215, 4.513488292694092, 4.70366096496582, 4.893833160400391, 5.084005355834961, 5.2741780281066895, 5.46435022354126]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 11.0, 12.0, 16.0, 13.0, 39.0, 42.0, 61.0, 88.0, 160.0, 292.0, 552.0, 1256.0, 3749.0, 14128.0, 135600.0, 3296241.0, 699325.0, 33450.0, 5904.0, 1699.0, 732.0, 341.0, 182.0, 118.0, 71.0, 68.0, 39.0, 29.0, 20.0, 10.0, 8.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.3133544921875, -5.134521484375, -4.9556884765625, -4.77685546875, -4.5980224609375, -4.419189453125, -4.2403564453125, -4.0615234375, -3.8826904296875, -3.703857421875, -3.5250244140625, -3.34619140625, -3.1673583984375, -2.988525390625, -2.8096923828125, -2.630859375, -2.4520263671875, -2.273193359375, -2.0943603515625, -1.91552734375, -1.7366943359375, -1.557861328125, -1.3790283203125, -1.2001953125, -1.0213623046875, -0.842529296875, -0.6636962890625, -0.48486328125, -0.3060302734375, -0.127197265625, 0.0516357421875, 0.23046875, 0.4093017578125, 0.588134765625, 0.7669677734375, 0.94580078125, 1.1246337890625, 1.303466796875, 1.4822998046875, 1.6611328125, 1.8399658203125, 2.018798828125, 2.1976318359375, 2.37646484375, 2.5552978515625, 2.734130859375, 2.9129638671875, 3.091796875, 3.2706298828125, 3.449462890625, 3.6282958984375, 3.80712890625, 3.9859619140625, 4.164794921875, 4.3436279296875, 4.5224609375, 4.7012939453125, 4.880126953125, 5.0589599609375, 5.23779296875, 5.4166259765625, 5.595458984375, 5.7742919921875, 5.953125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 8.0, 8.0, 5.0, 17.0, 19.0, 18.0, 29.0, 41.0, 51.0, 51.0, 55.0, 65.0, 78.0, 91.0, 72.0, 62.0, 71.0, 44.0, 48.0, 43.0, 34.0, 28.0, 24.0, 8.0, 12.0, 5.0, 1.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.591796875, -2.4971923828125, -2.402587890625, -2.3079833984375, -2.21337890625, -2.1187744140625, -2.024169921875, -1.9295654296875, -1.8349609375, -1.7403564453125, -1.645751953125, -1.5511474609375, -1.45654296875, -1.3619384765625, -1.267333984375, -1.1727294921875, -1.078125, -0.9835205078125, -0.888916015625, -0.7943115234375, -0.69970703125, -0.6051025390625, -0.510498046875, -0.4158935546875, -0.3212890625, -0.2266845703125, -0.132080078125, -0.0374755859375, 0.05712890625, 0.1517333984375, 0.246337890625, 0.3409423828125, 0.435546875, 0.5301513671875, 0.624755859375, 0.7193603515625, 0.81396484375, 0.9085693359375, 1.003173828125, 1.0977783203125, 1.1923828125, 1.2869873046875, 1.381591796875, 1.4761962890625, 1.57080078125, 1.6654052734375, 1.760009765625, 1.8546142578125, 1.94921875, 2.0438232421875, 2.138427734375, 2.2330322265625, 2.32763671875, 2.4222412109375, 2.516845703125, 2.6114501953125, 2.7060546875, 2.8006591796875, 2.895263671875, 2.9898681640625, 3.08447265625, 3.1790771484375, 3.273681640625, 3.3682861328125, 3.462890625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 10.0, 21.0, 34.0, 57.0, 91.0, 329.0, 761.0, 2530.0, 18735.0, 1054185.0, 3081151.0, 30904.0, 3807.0, 992.0, 318.0, 141.0, 69.0, 49.0, 28.0, 10.0, 8.0, 6.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.30859375, -5.06829833984375, -4.8280029296875, -4.58770751953125, -4.347412109375, -4.10711669921875, -3.8668212890625, -3.62652587890625, -3.38623046875, -3.14593505859375, -2.9056396484375, -2.66534423828125, -2.425048828125, -2.18475341796875, -1.9444580078125, -1.70416259765625, -1.4638671875, -1.22357177734375, -0.9832763671875, -0.74298095703125, -0.502685546875, -0.26239013671875, -0.0220947265625, 0.21820068359375, 0.45849609375, 0.69879150390625, 0.9390869140625, 1.17938232421875, 1.419677734375, 1.65997314453125, 1.9002685546875, 2.14056396484375, 2.380859375, 2.62115478515625, 2.8614501953125, 3.10174560546875, 3.342041015625, 3.58233642578125, 3.8226318359375, 4.06292724609375, 4.30322265625, 4.54351806640625, 4.7838134765625, 5.02410888671875, 5.264404296875, 5.50469970703125, 5.7449951171875, 5.98529052734375, 6.2255859375, 6.46588134765625, 6.7061767578125, 6.94647216796875, 7.186767578125, 7.42706298828125, 7.6673583984375, 7.90765380859375, 8.14794921875, 8.38824462890625, 8.6285400390625, 8.86883544921875, 9.109130859375, 9.34942626953125, 9.5897216796875, 9.83001708984375, 10.0703125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 10.0, 12.0, 14.0, 32.0, 47.0, 89.0, 129.0, 282.0, 629.0, 967.0, 889.0, 465.0, 230.0, 100.0, 59.0, 34.0, 29.0, 23.0, 18.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.298553466796875, -2.24359130859375, -2.188629150390625, -2.1336669921875, -2.078704833984375, -2.02374267578125, -1.968780517578125, -1.913818359375, -1.858856201171875, -1.80389404296875, -1.748931884765625, -1.6939697265625, -1.639007568359375, -1.58404541015625, -1.529083251953125, -1.47412109375, -1.419158935546875, -1.36419677734375, -1.309234619140625, -1.2542724609375, -1.199310302734375, -1.14434814453125, -1.089385986328125, -1.034423828125, -0.979461669921875, -0.92449951171875, -0.869537353515625, -0.8145751953125, -0.759613037109375, -0.70465087890625, -0.649688720703125, -0.5947265625, -0.539764404296875, -0.48480224609375, -0.429840087890625, -0.3748779296875, -0.319915771484375, -0.26495361328125, -0.209991455078125, -0.155029296875, -0.100067138671875, -0.04510498046875, 0.009857177734375, 0.0648193359375, 0.119781494140625, 0.17474365234375, 0.229705810546875, 0.28466796875, 0.339630126953125, 0.39459228515625, 0.449554443359375, 0.5045166015625, 0.559478759765625, 0.61444091796875, 0.669403076171875, 0.724365234375, 0.779327392578125, 0.83428955078125, 0.889251708984375, 0.9442138671875, 0.999176025390625, 1.05413818359375, 1.109100341796875, 1.1640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 10.0, 19.0, 26.0, 44.0, 64.0, 84.0, 105.0, 113.0, 120.0, 103.0, 97.0, 85.0, 39.0, 22.0, 25.0, 19.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.206478118896484, -8.033744812011719, -7.861011981964111, -7.688278675079346, -7.515545845031738, -7.342812538146973, -7.170079708099365, -6.9973464012146, -6.824613571166992, -6.651880264282227, -6.479147434234619, -6.3064141273498535, -6.133681297302246, -5.9609479904174805, -5.788215160369873, -5.615481853485107, -5.4427490234375, -5.270015716552734, -5.097282886505127, -4.924549579620361, -4.751816749572754, -4.579083442687988, -4.406350612640381, -4.233617305755615, -4.06088399887085, -3.888150930404663, -3.7154178619384766, -3.54268479347229, -3.3699517250061035, -3.197218656539917, -3.0244855880737305, -2.851752281188965, -2.6790192127227783, -2.506286144256592, -2.3335530757904053, -2.1608200073242188, -1.9880869388580322, -1.8153538703918457, -1.6426206827163696, -1.469887614250183, -1.2971545457839966, -1.12442147731781, -0.9516884088516235, -0.7789552807807922, -0.6062222123146057, -0.4334891438484192, -0.2607560157775879, -0.08802294731140137, 0.08471012115478516, 0.2574431896209717, 0.4301762878894806, 0.6029093861579895, 0.775642454624176, 0.9483755230903625, 1.1211086511611938, 1.2938417196273804, 1.466574788093567, 1.6393078565597534, 1.81204092502594, 1.984774112701416, 2.1575071811676025, 2.330240249633789, 2.5029733180999756, 2.675706386566162, 2.8484394550323486]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 11.0, 15.0, 9.0, 14.0, 13.0, 23.0, 21.0, 21.0, 27.0, 28.0, 46.0, 30.0, 46.0, 45.0, 37.0, 39.0, 54.0, 47.0, 46.0, 40.0, 46.0, 41.0, 38.0, 35.0, 32.0, 34.0, 26.0, 26.0, 18.0, 14.0, 9.0, 8.0, 12.0, 7.0, 5.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.432069778442383, -2.3531317710876465, -2.27419376373291, -2.195255756378174, -2.1163179874420166, -2.0373799800872803, -1.958441972732544, -1.8795039653778076, -1.8005659580230713, -1.721627950668335, -1.6426900625228882, -1.5637520551681519, -1.4848140478134155, -1.4058761596679688, -1.3269381523132324, -1.248000144958496, -1.1690622568130493, -1.090124249458313, -1.0111863613128662, -0.9322483539581299, -0.8533103466033936, -0.774372398853302, -0.6954344511032104, -0.6164964437484741, -0.5375584959983826, -0.45862051844596863, -0.3796825408935547, -0.30074459314346313, -0.2218066155910492, -0.14286863803863525, -0.0639306902885437, 0.015007317066192627, 0.09394526481628418, 0.17288324236869812, 0.25182121992111206, 0.3307591676712036, 0.40969714522361755, 0.4886351227760315, 0.567573070526123, 0.6465110778808594, 0.7254490256309509, 0.8043869733810425, 0.8833249807357788, 0.9622629284858704, 1.041200876235962, 1.1201388835906982, 1.1990768909454346, 1.278014898300171, 1.3569527864456177, 1.435890793800354, 1.5148286819458008, 1.593766689300537, 1.6727046966552734, 1.7516427040100098, 1.8305805921554565, 1.9095185995101929, 1.9884564876556396, 2.067394495010376, 2.1463325023651123, 2.2252702713012695, 2.304208278656006, 2.383146286010742, 2.4620842933654785, 2.541022300720215, 2.619960308074951]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 7.0, 17.0, 17.0, 27.0, 31.0, 47.0, 90.0, 132.0, 194.0, 312.0, 494.0, 855.0, 1543.0, 3551.0, 10728.0, 45521.0, 322823.0, 563092.0, 73968.0, 15672.0, 4808.0, 2060.0, 992.0, 548.0, 329.0, 227.0, 147.0, 93.0, 64.0, 49.0, 32.0, 26.0, 21.0, 13.0, 5.0, 6.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9775390625, -0.9497222900390625, -0.921905517578125, -0.8940887451171875, -0.86627197265625, -0.8384552001953125, -0.810638427734375, -0.7828216552734375, -0.7550048828125, -0.7271881103515625, -0.699371337890625, -0.6715545654296875, -0.64373779296875, -0.6159210205078125, -0.588104248046875, -0.5602874755859375, -0.532470703125, -0.5046539306640625, -0.476837158203125, -0.4490203857421875, -0.42120361328125, -0.3933868408203125, -0.365570068359375, -0.3377532958984375, -0.3099365234375, -0.2821197509765625, -0.254302978515625, -0.2264862060546875, -0.19866943359375, -0.1708526611328125, -0.143035888671875, -0.1152191162109375, -0.08740234375, -0.0595855712890625, -0.031768798828125, -0.0039520263671875, 0.02386474609375, 0.0516815185546875, 0.079498291015625, 0.1073150634765625, 0.1351318359375, 0.1629486083984375, 0.190765380859375, 0.2185821533203125, 0.24639892578125, 0.2742156982421875, 0.302032470703125, 0.3298492431640625, 0.357666015625, 0.3854827880859375, 0.413299560546875, 0.4411163330078125, 0.46893310546875, 0.4967498779296875, 0.524566650390625, 0.5523834228515625, 0.5802001953125, 0.6080169677734375, 0.635833740234375, 0.6636505126953125, 0.69146728515625, 0.7192840576171875, 0.747100830078125, 0.7749176025390625, 0.802734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 12.0, 6.0, 8.0, 14.0, 16.0, 19.0, 30.0, 27.0, 36.0, 36.0, 37.0, 47.0, 44.0, 65.0, 51.0, 64.0, 53.0, 61.0, 64.0, 42.0, 54.0, 40.0, 33.0, 29.0, 28.0, 14.0, 20.0, 18.0, 6.0, 5.0, 10.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.977386474609375, -1.90789794921875, -1.838409423828125, -1.7689208984375, -1.699432373046875, -1.62994384765625, -1.560455322265625, -1.490966796875, -1.421478271484375, -1.35198974609375, -1.282501220703125, -1.2130126953125, -1.143524169921875, -1.07403564453125, -1.004547119140625, -0.93505859375, -0.865570068359375, -0.79608154296875, -0.726593017578125, -0.6571044921875, -0.587615966796875, -0.51812744140625, -0.448638916015625, -0.379150390625, -0.309661865234375, -0.24017333984375, -0.170684814453125, -0.1011962890625, -0.031707763671875, 0.03778076171875, 0.107269287109375, 0.1767578125, 0.246246337890625, 0.31573486328125, 0.385223388671875, 0.4547119140625, 0.524200439453125, 0.59368896484375, 0.663177490234375, 0.732666015625, 0.802154541015625, 0.87164306640625, 0.941131591796875, 1.0106201171875, 1.080108642578125, 1.14959716796875, 1.219085693359375, 1.28857421875, 1.358062744140625, 1.42755126953125, 1.497039794921875, 1.5665283203125, 1.636016845703125, 1.70550537109375, 1.774993896484375, 1.844482421875, 1.913970947265625, 1.98345947265625, 2.052947998046875, 2.1224365234375, 2.191925048828125, 2.26141357421875, 2.330902099609375, 2.400390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 8.0, 11.0, 10.0, 20.0, 21.0, 40.0, 63.0, 84.0, 115.0, 183.0, 299.0, 395.0, 628.0, 1003.0, 1637.0, 2536.0, 4384.0, 7207.0, 13133.0, 24816.0, 50796.0, 113204.0, 285807.0, 304974.0, 122073.0, 53741.0, 27054.0, 14070.0, 8020.0, 4719.0, 2743.0, 1707.0, 1095.0, 671.0, 413.0, 269.0, 187.0, 135.0, 83.0, 61.0, 38.0, 34.0, 14.0, 8.0, 7.0, 11.0, 3.0, 8.0, 1.0, 1.0, 5.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.230224609375, -0.2230396270751953, -0.21585464477539062, -0.20866966247558594, -0.20148468017578125, -0.19429969787597656, -0.18711471557617188, -0.1799297332763672, -0.1727447509765625, -0.1655597686767578, -0.15837478637695312, -0.15118980407714844, -0.14400482177734375, -0.13681983947753906, -0.12963485717773438, -0.12244987487792969, -0.115264892578125, -0.10807991027832031, -0.10089492797851562, -0.09370994567871094, -0.08652496337890625, -0.07933998107910156, -0.07215499877929688, -0.06497001647949219, -0.0577850341796875, -0.05060005187988281, -0.043415069580078125, -0.03623008728027344, -0.02904510498046875, -0.021860122680664062, -0.014675140380859375, -0.0074901580810546875, -0.00030517578125, 0.0068798065185546875, 0.014064788818359375, 0.021249771118164062, 0.02843475341796875, 0.03561973571777344, 0.042804718017578125, 0.04998970031738281, 0.0571746826171875, 0.06435966491699219, 0.07154464721679688, 0.07872962951660156, 0.08591461181640625, 0.09309959411621094, 0.10028457641601562, 0.10746955871582031, 0.114654541015625, 0.12183952331542969, 0.12902450561523438, 0.13620948791503906, 0.14339447021484375, 0.15057945251464844, 0.15776443481445312, 0.1649494171142578, 0.1721343994140625, 0.1793193817138672, 0.18650436401367188, 0.19368934631347656, 0.20087432861328125, 0.20805931091308594, 0.21524429321289062, 0.2224292755126953, 0.2296142578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 3.0, 7.0, 9.0, 6.0, 14.0, 13.0, 5.0, 10.0, 13.0, 17.0, 19.0, 34.0, 21.0, 36.0, 40.0, 40.0, 44.0, 37.0, 43.0, 57.0, 53.0, 41.0, 58.0, 52.0, 50.0, 26.0, 46.0, 36.0, 37.0, 17.0, 27.0, 13.0, 11.0, 13.0, 11.0, 9.0, 6.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.140625, -4.02056884765625, -3.9005126953125, -3.78045654296875, -3.660400390625, -3.54034423828125, -3.4202880859375, -3.30023193359375, -3.18017578125, -3.06011962890625, -2.9400634765625, -2.82000732421875, -2.699951171875, -2.57989501953125, -2.4598388671875, -2.33978271484375, -2.2197265625, -2.09967041015625, -1.9796142578125, -1.85955810546875, -1.739501953125, -1.61944580078125, -1.4993896484375, -1.37933349609375, -1.25927734375, -1.13922119140625, -1.0191650390625, -0.89910888671875, -0.779052734375, -0.65899658203125, -0.5389404296875, -0.41888427734375, -0.298828125, -0.17877197265625, -0.0587158203125, 0.06134033203125, 0.181396484375, 0.30145263671875, 0.4215087890625, 0.54156494140625, 0.66162109375, 0.78167724609375, 0.9017333984375, 1.02178955078125, 1.141845703125, 1.26190185546875, 1.3819580078125, 1.50201416015625, 1.6220703125, 1.74212646484375, 1.8621826171875, 1.98223876953125, 2.102294921875, 2.22235107421875, 2.3424072265625, 2.46246337890625, 2.58251953125, 2.70257568359375, 2.8226318359375, 2.94268798828125, 3.062744140625, 3.18280029296875, 3.3028564453125, 3.42291259765625, 3.54296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 10.0, 9.0, 22.0, 25.0, 49.0, 86.0, 143.0, 254.0, 610.0, 1492.0, 5119.0, 31914.0, 585387.0, 391962.0, 24501.0, 4453.0, 1345.0, 529.0, 258.0, 143.0, 85.0, 53.0, 35.0, 22.0, 12.0, 10.0, 11.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08428955078125, -0.08137702941894531, -0.07846450805664062, -0.07555198669433594, -0.07263946533203125, -0.06972694396972656, -0.06681442260742188, -0.06390190124511719, -0.0609893798828125, -0.05807685852050781, -0.055164337158203125, -0.05225181579589844, -0.04933929443359375, -0.04642677307128906, -0.043514251708984375, -0.04060173034667969, -0.037689208984375, -0.03477668762207031, -0.031864166259765625, -0.028951644897460938, -0.02603912353515625, -0.023126602172851562, -0.020214080810546875, -0.017301559448242188, -0.0143890380859375, -0.011476516723632812, -0.008563995361328125, -0.0056514739990234375, -0.00273895263671875, 0.0001735687255859375, 0.003086090087890625, 0.0059986114501953125, 0.0089111328125, 0.011823654174804688, 0.014736175537109375, 0.017648696899414062, 0.02056121826171875, 0.023473739624023438, 0.026386260986328125, 0.029298782348632812, 0.0322113037109375, 0.03512382507324219, 0.038036346435546875, 0.04094886779785156, 0.04386138916015625, 0.04677391052246094, 0.049686431884765625, 0.05259895324707031, 0.055511474609375, 0.05842399597167969, 0.061336517333984375, 0.06424903869628906, 0.06716156005859375, 0.07007408142089844, 0.07298660278320312, 0.07589912414550781, 0.0788116455078125, 0.08172416687011719, 0.08463668823242188, 0.08754920959472656, 0.09046173095703125, 0.09337425231933594, 0.09628677368164062, 0.09919929504394531, 0.10211181640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 7.0, 4.0, 4.0, 8.0, 13.0, 11.0, 25.0, 36.0, 50.0, 62.0, 106.0, 109.0, 126.0, 109.0, 94.0, 66.0, 45.0, 34.0, 32.0, 18.0, 15.0, 10.0, 10.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0], "bins": [-6.35385513305664e-05, -6.20819628238678e-05, -6.062537431716919e-05, -5.916878581047058e-05, -5.771219730377197e-05, -5.6255608797073364e-05, -5.4799020290374756e-05, -5.334243178367615e-05, -5.188584327697754e-05, -5.042925477027893e-05, -4.897266626358032e-05, -4.7516077756881714e-05, -4.6059489250183105e-05, -4.46029007434845e-05, -4.314631223678589e-05, -4.168972373008728e-05, -4.023313522338867e-05, -3.8776546716690063e-05, -3.7319958209991455e-05, -3.586336970329285e-05, -3.440678119659424e-05, -3.295019268989563e-05, -3.149360418319702e-05, -3.0037015676498413e-05, -2.8580427169799805e-05, -2.7123838663101196e-05, -2.5667250156402588e-05, -2.421066164970398e-05, -2.275407314300537e-05, -2.1297484636306763e-05, -1.9840896129608154e-05, -1.8384307622909546e-05, -1.6927719116210938e-05, -1.547113060951233e-05, -1.401454210281372e-05, -1.2557953596115112e-05, -1.1101365089416504e-05, -9.644776582717896e-06, -8.188188076019287e-06, -6.731599569320679e-06, -5.27501106262207e-06, -3.818422555923462e-06, -2.3618340492248535e-06, -9.052455425262451e-07, 5.513429641723633e-07, 2.0079314708709717e-06, 3.46451997756958e-06, 4.9211084842681885e-06, 6.377696990966797e-06, 7.834285497665405e-06, 9.290874004364014e-06, 1.0747462511062622e-05, 1.220405101776123e-05, 1.3660639524459839e-05, 1.5117228031158447e-05, 1.6573816537857056e-05, 1.8030405044555664e-05, 1.9486993551254272e-05, 2.094358205795288e-05, 2.240017056465149e-05, 2.3856759071350098e-05, 2.5313347578048706e-05, 2.6769936084747314e-05, 2.8226524591445923e-05, 2.968311309814453e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 14.0, 29.0, 39.0, 80.0, 142.0, 286.0, 714.0, 2256.0, 10163.0, 80094.0, 849057.0, 90401.0, 11362.0, 2524.0, 756.0, 322.0, 144.0, 53.0, 38.0, 21.0, 8.0, 9.0, 4.0, 12.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1329345703125, -0.1289691925048828, -0.12500381469726562, -0.12103843688964844, -0.11707305908203125, -0.11310768127441406, -0.10914230346679688, -0.10517692565917969, -0.1012115478515625, -0.09724617004394531, -0.09328079223632812, -0.08931541442871094, -0.08535003662109375, -0.08138465881347656, -0.07741928100585938, -0.07345390319824219, -0.069488525390625, -0.06552314758300781, -0.061557769775390625, -0.05759239196777344, -0.05362701416015625, -0.04966163635253906, -0.045696258544921875, -0.04173088073730469, -0.0377655029296875, -0.03380012512207031, -0.029834747314453125, -0.025869369506835938, -0.02190399169921875, -0.017938613891601562, -0.013973236083984375, -0.010007858276367188, -0.00604248046875, -0.0020771026611328125, 0.001888275146484375, 0.0058536529541015625, 0.00981903076171875, 0.013784408569335938, 0.017749786376953125, 0.021715164184570312, 0.0256805419921875, 0.029645919799804688, 0.033611297607421875, 0.03757667541503906, 0.04154205322265625, 0.04550743103027344, 0.049472808837890625, 0.05343818664550781, 0.057403564453125, 0.06136894226074219, 0.06533432006835938, 0.06929969787597656, 0.07326507568359375, 0.07723045349121094, 0.08119583129882812, 0.08516120910644531, 0.0891265869140625, 0.09309196472167969, 0.09705734252929688, 0.10102272033691406, 0.10498809814453125, 0.10895347595214844, 0.11291885375976562, 0.11688423156738281, 0.120849609375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 7.0, 6.0, 6.0, 10.0, 26.0, 30.0, 70.0, 90.0, 202.0, 232.0, 131.0, 73.0, 37.0, 18.0, 17.0, 13.0, 9.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02728271484375, -0.026459932327270508, -0.025637149810791016, -0.024814367294311523, -0.02399158477783203, -0.02316880226135254, -0.022346019744873047, -0.021523237228393555, -0.020700454711914062, -0.01987767219543457, -0.019054889678955078, -0.018232107162475586, -0.017409324645996094, -0.0165865421295166, -0.01576375961303711, -0.014940977096557617, -0.014118194580078125, -0.013295412063598633, -0.01247262954711914, -0.011649847030639648, -0.010827064514160156, -0.010004281997680664, -0.009181499481201172, -0.00835871696472168, -0.0075359344482421875, -0.006713151931762695, -0.005890369415283203, -0.005067586898803711, -0.004244804382324219, -0.0034220218658447266, -0.0025992393493652344, -0.0017764568328857422, -0.00095367431640625, -0.0001308917999267578, 0.0006918907165527344, 0.0015146732330322266, 0.0023374557495117188, 0.003160238265991211, 0.003983020782470703, 0.004805803298950195, 0.0056285858154296875, 0.00645136833190918, 0.007274150848388672, 0.008096933364868164, 0.008919715881347656, 0.009742498397827148, 0.01056528091430664, 0.011388063430786133, 0.012210845947265625, 0.013033628463745117, 0.01385641098022461, 0.014679193496704102, 0.015501976013183594, 0.016324758529663086, 0.017147541046142578, 0.01797032356262207, 0.018793106079101562, 0.019615888595581055, 0.020438671112060547, 0.02126145362854004, 0.02208423614501953, 0.022907018661499023, 0.023729801177978516, 0.024552583694458008, 0.0253753662109375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 22.0, 54.0, 104.0, 165.0, 212.0, 189.0, 122.0, 61.0, 36.0, 15.0, 10.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.862611770629883, -5.671850681304932, -5.481089115142822, -5.290328025817871, -5.09956693649292, -4.908805847167969, -4.718044281005859, -4.527283191680908, -4.336522102355957, -4.145761013031006, -3.9549996852874756, -3.7642383575439453, -3.573477268218994, -3.382715940475464, -3.1919546127319336, -3.0011935234069824, -2.810431957244873, -2.6196706295013428, -2.4289095401763916, -2.2381482124328613, -2.04738712310791, -1.8566257953643799, -1.6658644676208496, -1.4751032590866089, -1.2843420505523682, -1.0935808420181274, -0.9028195738792419, -0.7120583057403564, -0.5212970972061157, -0.330535888671875, -0.13977456092834473, 0.050986647605895996, 0.24174737930297852, 0.4325086176395416, 0.6232698559761047, 0.8140311241149902, 1.004792332649231, 1.1955535411834717, 1.386314868927002, 1.5770760774612427, 1.7678372859954834, 1.9585984945297241, 2.149359703063965, 2.340121030807495, 2.5308823585510254, 2.7216434478759766, 2.912404775619507, 3.103166103363037, 3.2939271926879883, 3.4846885204315186, 3.6754496097564697, 3.8662109375, 4.056972026824951, 4.247733116149902, 4.438494682312012, 4.629255771636963, 4.820016860961914, 5.010777950286865, 5.201539516448975, 5.392300605773926, 5.583061695098877, 5.773822784423828, 5.9645843505859375, 6.155345439910889, 6.346107006072998]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 3.0, 13.0, 15.0, 20.0, 15.0, 25.0, 33.0, 29.0, 50.0, 49.0, 56.0, 64.0, 50.0, 68.0, 66.0, 67.0, 53.0, 55.0, 55.0, 41.0, 38.0, 32.0, 30.0, 15.0, 8.0, 14.0, 13.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.867017388343811, -1.79472017288208, -1.7224228382110596, -1.650125503540039, -1.577828288078308, -1.5055310726165771, -1.4332337379455566, -1.3609364032745361, -1.2886391878128052, -1.2163419723510742, -1.1440446376800537, -1.0717473030090332, -0.9994500875473022, -0.9271528124809265, -0.8548555374145508, -0.782558262348175, -0.7102609872817993, -0.6379637122154236, -0.5656664371490479, -0.4933691620826721, -0.4210718870162964, -0.34877461194992065, -0.2764773368835449, -0.2041800618171692, -0.13188278675079346, -0.059585511684417725, 0.012711763381958008, 0.08500903844833374, 0.15730631351470947, 0.2296035885810852, 0.30190086364746094, 0.37419813871383667, 0.44649529457092285, 0.5187925696372986, 0.5910898447036743, 0.66338711977005, 0.7356843948364258, 0.8079816699028015, 0.8802789449691772, 0.952576220035553, 1.0248734951019287, 1.0971708297729492, 1.1694680452346802, 1.2417652606964111, 1.3140625953674316, 1.3863599300384521, 1.458657145500183, 1.530954360961914, 1.6032516956329346, 1.675549030303955, 1.747846245765686, 1.820143461227417, 1.8924407958984375, 1.964738130569458, 2.0370354652404785, 2.10933256149292, 2.1816298961639404, 2.253927230834961, 2.3262243270874023, 2.398521661758423, 2.4708189964294434, 2.543116331100464, 2.6154136657714844, 2.687710762023926, 2.7600080966949463]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 16.0, 14.0, 28.0, 42.0, 65.0, 117.0, 153.0, 299.0, 587.0, 1108.0, 2681.0, 7492.0, 26927.0, 150235.0, 686589.0, 135074.0, 24952.0, 7142.0, 2609.0, 1066.0, 560.0, 284.0, 204.0, 104.0, 65.0, 39.0, 27.0, 20.0, 12.0, 5.0, 3.0, 7.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.552734375, -2.46612548828125, -2.3795166015625, -2.29290771484375, -2.206298828125, -2.11968994140625, -2.0330810546875, -1.94647216796875, -1.85986328125, -1.77325439453125, -1.6866455078125, -1.60003662109375, -1.513427734375, -1.42681884765625, -1.3402099609375, -1.25360107421875, -1.1669921875, -1.08038330078125, -0.9937744140625, -0.90716552734375, -0.820556640625, -0.73394775390625, -0.6473388671875, -0.56072998046875, -0.47412109375, -0.38751220703125, -0.3009033203125, -0.21429443359375, -0.127685546875, -0.04107666015625, 0.0455322265625, 0.13214111328125, 0.21875, 0.30535888671875, 0.3919677734375, 0.47857666015625, 0.565185546875, 0.65179443359375, 0.7384033203125, 0.82501220703125, 0.91162109375, 0.99822998046875, 1.0848388671875, 1.17144775390625, 1.258056640625, 1.34466552734375, 1.4312744140625, 1.51788330078125, 1.6044921875, 1.69110107421875, 1.7777099609375, 1.86431884765625, 1.950927734375, 2.03753662109375, 2.1241455078125, 2.21075439453125, 2.29736328125, 2.38397216796875, 2.4705810546875, 2.55718994140625, 2.643798828125, 2.73040771484375, 2.8170166015625, 2.90362548828125, 2.990234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 10.0, 5.0, 17.0, 15.0, 21.0, 34.0, 45.0, 42.0, 39.0, 44.0, 64.0, 66.0, 50.0, 53.0, 58.0, 57.0, 54.0, 45.0, 47.0, 41.0, 44.0, 35.0, 25.0, 22.0, 12.0, 11.0, 8.0, 9.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.51171875, -4.381134033203125, -4.25054931640625, -4.119964599609375, -3.9893798828125, -3.858795166015625, -3.72821044921875, -3.597625732421875, -3.467041015625, -3.336456298828125, -3.20587158203125, -3.075286865234375, -2.9447021484375, -2.814117431640625, -2.68353271484375, -2.552947998046875, -2.42236328125, -2.291778564453125, -2.16119384765625, -2.030609130859375, -1.9000244140625, -1.769439697265625, -1.63885498046875, -1.508270263671875, -1.377685546875, -1.247100830078125, -1.11651611328125, -0.985931396484375, -0.8553466796875, -0.724761962890625, -0.59417724609375, -0.463592529296875, -0.3330078125, -0.202423095703125, -0.07183837890625, 0.058746337890625, 0.1893310546875, 0.319915771484375, 0.45050048828125, 0.581085205078125, 0.711669921875, 0.842254638671875, 0.97283935546875, 1.103424072265625, 1.2340087890625, 1.364593505859375, 1.49517822265625, 1.625762939453125, 1.75634765625, 1.886932373046875, 2.01751708984375, 2.148101806640625, 2.2786865234375, 2.409271240234375, 2.53985595703125, 2.670440673828125, 2.801025390625, 2.931610107421875, 3.06219482421875, 3.192779541015625, 3.3233642578125, 3.453948974609375, 3.58453369140625, 3.715118408203125, 3.845703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 5.0, 2.0, 9.0, 12.0, 10.0, 16.0, 13.0, 23.0, 31.0, 44.0, 55.0, 75.0, 132.0, 270.0, 728.0, 3526.0, 50577.0, 953998.0, 34859.0, 2799.0, 682.0, 239.0, 119.0, 80.0, 48.0, 40.0, 36.0, 20.0, 25.0, 17.0, 8.0, 5.0, 14.0, 8.0, 10.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.6484375, -8.41748046875, -8.1865234375, -7.95556640625, -7.724609375, -7.49365234375, -7.2626953125, -7.03173828125, -6.80078125, -6.56982421875, -6.3388671875, -6.10791015625, -5.876953125, -5.64599609375, -5.4150390625, -5.18408203125, -4.953125, -4.72216796875, -4.4912109375, -4.26025390625, -4.029296875, -3.79833984375, -3.5673828125, -3.33642578125, -3.10546875, -2.87451171875, -2.6435546875, -2.41259765625, -2.181640625, -1.95068359375, -1.7197265625, -1.48876953125, -1.2578125, -1.02685546875, -0.7958984375, -0.56494140625, -0.333984375, -0.10302734375, 0.1279296875, 0.35888671875, 0.58984375, 0.82080078125, 1.0517578125, 1.28271484375, 1.513671875, 1.74462890625, 1.9755859375, 2.20654296875, 2.4375, 2.66845703125, 2.8994140625, 3.13037109375, 3.361328125, 3.59228515625, 3.8232421875, 4.05419921875, 4.28515625, 4.51611328125, 4.7470703125, 4.97802734375, 5.208984375, 5.43994140625, 5.6708984375, 5.90185546875, 6.1328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 6.0, 9.0, 12.0, 5.0, 9.0, 5.0, 17.0, 16.0, 18.0, 25.0, 26.0, 28.0, 28.0, 34.0, 38.0, 35.0, 49.0, 52.0, 46.0, 45.0, 53.0, 44.0, 47.0, 50.0, 32.0, 38.0, 26.0, 30.0, 35.0, 17.0, 27.0, 15.0, 16.0, 12.0, 7.0, 9.0, 10.0, 7.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.827880859375, -3.70654296875, -3.585205078125, -3.4638671875, -3.342529296875, -3.22119140625, -3.099853515625, -2.978515625, -2.857177734375, -2.73583984375, -2.614501953125, -2.4931640625, -2.371826171875, -2.25048828125, -2.129150390625, -2.0078125, -1.886474609375, -1.76513671875, -1.643798828125, -1.5224609375, -1.401123046875, -1.27978515625, -1.158447265625, -1.037109375, -0.915771484375, -0.79443359375, -0.673095703125, -0.5517578125, -0.430419921875, -0.30908203125, -0.187744140625, -0.06640625, 0.054931640625, 0.17626953125, 0.297607421875, 0.4189453125, 0.540283203125, 0.66162109375, 0.782958984375, 0.904296875, 1.025634765625, 1.14697265625, 1.268310546875, 1.3896484375, 1.510986328125, 1.63232421875, 1.753662109375, 1.875, 1.996337890625, 2.11767578125, 2.239013671875, 2.3603515625, 2.481689453125, 2.60302734375, 2.724365234375, 2.845703125, 2.967041015625, 3.08837890625, 3.209716796875, 3.3310546875, 3.452392578125, 3.57373046875, 3.695068359375, 3.81640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 8.0, 12.0, 20.0, 31.0, 47.0, 73.0, 151.0, 297.0, 888.0, 3647.0, 24149.0, 328584.0, 646697.0, 37163.0, 4954.0, 1033.0, 364.0, 185.0, 84.0, 50.0, 34.0, 13.0, 11.0, 16.0, 9.0, 9.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.90087890625, -0.8663558959960938, -0.8318328857421875, -0.7973098754882812, -0.762786865234375, -0.7282638549804688, -0.6937408447265625, -0.6592178344726562, -0.62469482421875, -0.5901718139648438, -0.5556488037109375, -0.5211257934570312, -0.486602783203125, -0.45207977294921875, -0.4175567626953125, -0.38303375244140625, -0.3485107421875, -0.31398773193359375, -0.2794647216796875, -0.24494171142578125, -0.210418701171875, -0.17589569091796875, -0.1413726806640625, -0.10684967041015625, -0.07232666015625, -0.03780364990234375, -0.0032806396484375, 0.03124237060546875, 0.065765380859375, 0.10028839111328125, 0.1348114013671875, 0.16933441162109375, 0.203857421875, 0.23838043212890625, 0.2729034423828125, 0.30742645263671875, 0.341949462890625, 0.37647247314453125, 0.4109954833984375, 0.44551849365234375, 0.48004150390625, 0.5145645141601562, 0.5490875244140625, 0.5836105346679688, 0.618133544921875, 0.6526565551757812, 0.6871795654296875, 0.7217025756835938, 0.7562255859375, 0.7907485961914062, 0.8252716064453125, 0.8597946166992188, 0.894317626953125, 0.9288406372070312, 0.9633636474609375, 0.9978866577148438, 1.03240966796875, 1.0669326782226562, 1.1014556884765625, 1.1359786987304688, 1.170501708984375, 1.2050247192382812, 1.2395477294921875, 1.2740707397460938, 1.30859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 10.0, 11.0, 12.0, 11.0, 23.0, 28.0, 33.0, 49.0, 52.0, 79.0, 113.0, 139.0, 126.0, 91.0, 55.0, 52.0, 16.0, 25.0, 12.0, 14.0, 11.0, 7.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010645389556884766, -0.00010307691991329193, -9.96999442577362e-05, -9.632296860218048e-05, -9.294599294662476e-05, -8.956901729106903e-05, -8.61920416355133e-05, -8.281506597995758e-05, -7.943809032440186e-05, -7.606111466884613e-05, -7.26841390132904e-05, -6.930716335773468e-05, -6.593018770217896e-05, -6.255321204662323e-05, -5.9176236391067505e-05, -5.579926073551178e-05, -5.2422285079956055e-05, -4.904530942440033e-05, -4.5668333768844604e-05, -4.229135811328888e-05, -3.8914382457733154e-05, -3.553740680217743e-05, -3.2160431146621704e-05, -2.878345549106598e-05, -2.5406479835510254e-05, -2.202950417995453e-05, -1.8652528524398804e-05, -1.527555286884308e-05, -1.1898577213287354e-05, -8.521601557731628e-06, -5.144625902175903e-06, -1.7676502466201782e-06, 1.6093254089355469e-06, 4.986301064491272e-06, 8.363276720046997e-06, 1.1740252375602722e-05, 1.5117228031158447e-05, 1.8494203686714172e-05, 2.1871179342269897e-05, 2.5248154997825623e-05, 2.8625130653381348e-05, 3.200210630893707e-05, 3.53790819644928e-05, 3.875605762004852e-05, 4.213303327560425e-05, 4.551000893115997e-05, 4.88869845867157e-05, 5.226396024227142e-05, 5.564093589782715e-05, 5.9017911553382874e-05, 6.23948872089386e-05, 6.577186286449432e-05, 6.914883852005005e-05, 7.252581417560577e-05, 7.59027898311615e-05, 7.927976548671722e-05, 8.265674114227295e-05, 8.603371679782867e-05, 8.94106924533844e-05, 9.278766810894012e-05, 9.616464376449585e-05, 9.954161942005157e-05, 0.0001029185950756073, 0.00010629557073116302, 0.00010967254638671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 10.0, 9.0, 29.0, 56.0, 128.0, 316.0, 759.0, 2037.0, 7328.0, 54202.0, 839349.0, 127767.0, 12058.0, 2872.0, 980.0, 361.0, 147.0, 69.0, 43.0, 18.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.207794189453125, -1.16070556640625, -1.113616943359375, -1.0665283203125, -1.019439697265625, -0.97235107421875, -0.925262451171875, -0.878173828125, -0.831085205078125, -0.78399658203125, -0.736907958984375, -0.6898193359375, -0.642730712890625, -0.59564208984375, -0.548553466796875, -0.50146484375, -0.454376220703125, -0.40728759765625, -0.360198974609375, -0.3131103515625, -0.266021728515625, -0.21893310546875, -0.171844482421875, -0.124755859375, -0.077667236328125, -0.03057861328125, 0.016510009765625, 0.0635986328125, 0.110687255859375, 0.15777587890625, 0.204864501953125, 0.251953125, 0.299041748046875, 0.34613037109375, 0.393218994140625, 0.4403076171875, 0.487396240234375, 0.53448486328125, 0.581573486328125, 0.628662109375, 0.675750732421875, 0.72283935546875, 0.769927978515625, 0.8170166015625, 0.864105224609375, 0.91119384765625, 0.958282470703125, 1.00537109375, 1.052459716796875, 1.09954833984375, 1.146636962890625, 1.1937255859375, 1.240814208984375, 1.28790283203125, 1.334991455078125, 1.382080078125, 1.429168701171875, 1.47625732421875, 1.523345947265625, 1.5704345703125, 1.617523193359375, 1.66461181640625, 1.711700439453125, 1.7587890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 15.0, 21.0, 26.0, 52.0, 79.0, 122.0, 204.0, 197.0, 93.0, 65.0, 28.0, 33.0, 27.0, 15.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6722526550292969, -0.6540756225585938, -0.6358985900878906, -0.6177215576171875, -0.5995445251464844, -0.5813674926757812, -0.5631904602050781, -0.545013427734375, -0.5268363952636719, -0.5086593627929688, -0.4904823303222656, -0.4723052978515625, -0.4541282653808594, -0.43595123291015625, -0.4177742004394531, -0.39959716796875, -0.3814201354980469, -0.36324310302734375, -0.3450660705566406, -0.3268890380859375, -0.3087120056152344, -0.29053497314453125, -0.2723579406738281, -0.254180908203125, -0.23600387573242188, -0.21782684326171875, -0.19964981079101562, -0.1814727783203125, -0.16329574584960938, -0.14511871337890625, -0.12694168090820312, -0.1087646484375, -0.09058761596679688, -0.07241058349609375, -0.054233551025390625, -0.0360565185546875, -0.017879486083984375, 0.00029754638671875, 0.018474578857421875, 0.036651611328125, 0.054828643798828125, 0.07300567626953125, 0.09118270874023438, 0.1093597412109375, 0.12753677368164062, 0.14571380615234375, 0.16389083862304688, 0.18206787109375, 0.20024490356445312, 0.21842193603515625, 0.23659896850585938, 0.2547760009765625, 0.2729530334472656, 0.29113006591796875, 0.3093070983886719, 0.327484130859375, 0.3456611633300781, 0.36383819580078125, 0.3820152282714844, 0.4001922607421875, 0.4183692932128906, 0.43654632568359375, 0.4547233581542969, 0.472900390625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 15.0, 27.0, 45.0, 43.0, 71.0, 81.0, 88.0, 104.0, 109.0, 84.0, 75.0, 74.0, 50.0, 33.0, 23.0, 16.0, 20.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.314308166503906, -6.128770351409912, -5.943232536315918, -5.757694721221924, -5.57215690612793, -5.386618614196777, -5.201080799102783, -5.015542984008789, -4.830005168914795, -4.644467353820801, -4.458929538726807, -4.2733917236328125, -4.08785343170166, -3.902315855026245, -3.716777801513672, -3.5312399864196777, -3.3457021713256836, -3.1601643562316895, -2.9746265411376953, -2.789088487625122, -2.603550672531128, -2.418012857437134, -2.2324748039245605, -2.0469369888305664, -1.8613991737365723, -1.6758613586425781, -1.4903234243392944, -1.3047854900360107, -1.1192476749420166, -0.9337098002433777, -0.7481719255447388, -0.5626339912414551, -0.37709569931030273, -0.19155782461166382, -0.006019949913024902, 0.179517924785614, 0.36505579948425293, 0.5505936741828918, 0.7361315488815308, 0.9216694831848145, 1.1072072982788086, 1.2927451133728027, 1.4782830476760864, 1.6638209819793701, 1.8493587970733643, 2.0348966121673584, 2.2204346656799316, 2.405972480773926, 2.59151029586792, 2.777048110961914, 2.962585926055908, 3.1481239795684814, 3.3336617946624756, 3.5191996097564697, 3.704737663269043, 3.890275478363037, 4.075813293457031, 4.261351108551025, 4.4468889236450195, 4.632426738739014, 4.817964553833008, 5.00350284576416, 5.189040660858154, 5.374578475952148, 5.560116291046143]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 7.0, 4.0, 5.0, 12.0, 10.0, 19.0, 5.0, 14.0, 16.0, 22.0, 23.0, 26.0, 18.0, 29.0, 26.0, 27.0, 33.0, 35.0, 21.0, 34.0, 31.0, 38.0, 46.0, 42.0, 40.0, 29.0, 40.0, 26.0, 31.0, 26.0, 38.0, 25.0, 21.0, 31.0, 13.0, 21.0, 12.0, 22.0, 22.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.3152008056640625, -5.153570175170898, -4.991939544677734, -4.830308437347412, -4.668677806854248, -4.507047176361084, -4.345416069030762, -4.183785438537598, -4.022154808044434, -3.8605241775512695, -3.6988933086395264, -3.537262439727783, -3.375631809234619, -3.214001178741455, -3.052370309829712, -2.8907394409179688, -2.7291088104248047, -2.5674781799316406, -2.4058473110198975, -2.2442164421081543, -2.0825858116149902, -1.9209550619125366, -1.759324312210083, -1.5976935625076294, -1.4360628128051758, -1.2744320631027222, -1.1128013134002686, -0.9511705636978149, -0.7895398139953613, -0.6279090642929077, -0.4662783145904541, -0.3046475648880005, -0.14301681518554688, 0.01861393451690674, 0.18024468421936035, 0.34187543392181396, 0.5035061836242676, 0.6651369333267212, 0.8267676830291748, 0.9883984327316284, 1.150029182434082, 1.3116599321365356, 1.4732906818389893, 1.6349214315414429, 1.7965521812438965, 1.95818293094635, 2.1198136806488037, 2.281444549560547, 2.443075180053711, 2.604705810546875, 2.766336679458618, 2.9279675483703613, 3.0895981788635254, 3.2512288093566895, 3.4128596782684326, 3.574490547180176, 3.73612117767334, 3.897751808166504, 4.059382438659668, 4.22101354598999, 4.382644176483154, 4.544274806976318, 4.705905914306641, 4.867536544799805, 5.029167175292969]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 5.0, 5.0, 11.0, 24.0, 27.0, 37.0, 43.0, 78.0, 139.0, 206.0, 361.0, 781.0, 1777.0, 5153.0, 17465.0, 129847.0, 2555025.0, 1398102.0, 67743.0, 11553.0, 3272.0, 1259.0, 585.0, 288.0, 179.0, 120.0, 67.0, 41.0, 23.0, 16.0, 15.0, 15.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.82135009765625, -4.6700439453125, -4.51873779296875, -4.367431640625, -4.21612548828125, -4.0648193359375, -3.91351318359375, -3.76220703125, -3.61090087890625, -3.4595947265625, -3.30828857421875, -3.156982421875, -3.00567626953125, -2.8543701171875, -2.70306396484375, -2.5517578125, -2.40045166015625, -2.2491455078125, -2.09783935546875, -1.946533203125, -1.79522705078125, -1.6439208984375, -1.49261474609375, -1.34130859375, -1.19000244140625, -1.0386962890625, -0.88739013671875, -0.736083984375, -0.58477783203125, -0.4334716796875, -0.28216552734375, -0.130859375, 0.02044677734375, 0.1717529296875, 0.32305908203125, 0.474365234375, 0.62567138671875, 0.7769775390625, 0.92828369140625, 1.07958984375, 1.23089599609375, 1.3822021484375, 1.53350830078125, 1.684814453125, 1.83612060546875, 1.9874267578125, 2.13873291015625, 2.2900390625, 2.44134521484375, 2.5926513671875, 2.74395751953125, 2.895263671875, 3.04656982421875, 3.1978759765625, 3.34918212890625, 3.50048828125, 3.65179443359375, 3.8031005859375, 3.95440673828125, 4.105712890625, 4.25701904296875, 4.4083251953125, 4.55963134765625, 4.7109375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 5.0, 5.0, 9.0, 14.0, 16.0, 20.0, 26.0, 36.0, 45.0, 44.0, 39.0, 70.0, 73.0, 72.0, 67.0, 65.0, 64.0, 69.0, 73.0, 56.0, 36.0, 30.0, 11.0, 20.0, 19.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.57421875, -2.480010986328125, -2.38580322265625, -2.291595458984375, -2.1973876953125, -2.103179931640625, -2.00897216796875, -1.914764404296875, -1.820556640625, -1.726348876953125, -1.63214111328125, -1.537933349609375, -1.4437255859375, -1.349517822265625, -1.25531005859375, -1.161102294921875, -1.06689453125, -0.972686767578125, -0.87847900390625, -0.784271240234375, -0.6900634765625, -0.595855712890625, -0.50164794921875, -0.407440185546875, -0.313232421875, -0.219024658203125, -0.12481689453125, -0.030609130859375, 0.0635986328125, 0.157806396484375, 0.25201416015625, 0.346221923828125, 0.4404296875, 0.534637451171875, 0.62884521484375, 0.723052978515625, 0.8172607421875, 0.911468505859375, 1.00567626953125, 1.099884033203125, 1.194091796875, 1.288299560546875, 1.38250732421875, 1.476715087890625, 1.5709228515625, 1.665130615234375, 1.75933837890625, 1.853546142578125, 1.94775390625, 2.041961669921875, 2.13616943359375, 2.230377197265625, 2.3245849609375, 2.418792724609375, 2.51300048828125, 2.607208251953125, 2.701416015625, 2.795623779296875, 2.88983154296875, 2.984039306640625, 3.0782470703125, 3.172454833984375, 3.26666259765625, 3.360870361328125, 3.455078125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 9.0, 1.0, 4.0, 4.0, 5.0, 6.0, 5.0, 10.0, 18.0, 28.0, 32.0, 44.0, 89.0, 126.0, 231.0, 532.0, 1234.0, 4094.0, 20644.0, 284796.0, 3737378.0, 126474.0, 13511.0, 2979.0, 1018.0, 433.0, 229.0, 124.0, 73.0, 53.0, 26.0, 22.0, 13.0, 9.0, 15.0, 3.0, 7.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015625, -4.8099365234375, -4.604248046875, -4.3985595703125, -4.19287109375, -3.9871826171875, -3.781494140625, -3.5758056640625, -3.3701171875, -3.1644287109375, -2.958740234375, -2.7530517578125, -2.54736328125, -2.3416748046875, -2.135986328125, -1.9302978515625, -1.724609375, -1.5189208984375, -1.313232421875, -1.1075439453125, -0.90185546875, -0.6961669921875, -0.490478515625, -0.2847900390625, -0.0791015625, 0.1265869140625, 0.332275390625, 0.5379638671875, 0.74365234375, 0.9493408203125, 1.155029296875, 1.3607177734375, 1.56640625, 1.7720947265625, 1.977783203125, 2.1834716796875, 2.38916015625, 2.5948486328125, 2.800537109375, 3.0062255859375, 3.2119140625, 3.4176025390625, 3.623291015625, 3.8289794921875, 4.03466796875, 4.2403564453125, 4.446044921875, 4.6517333984375, 4.857421875, 5.0631103515625, 5.268798828125, 5.4744873046875, 5.68017578125, 5.8858642578125, 6.091552734375, 6.2972412109375, 6.5029296875, 6.7086181640625, 6.914306640625, 7.1199951171875, 7.32568359375, 7.5313720703125, 7.737060546875, 7.9427490234375, 8.1484375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 9.0, 7.0, 19.0, 23.0, 28.0, 57.0, 84.0, 134.0, 277.0, 458.0, 733.0, 832.0, 613.0, 301.0, 166.0, 95.0, 75.0, 41.0, 19.0, 16.0, 24.0, 15.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9560546875, -1.904754638671875, -1.85345458984375, -1.802154541015625, -1.7508544921875, -1.699554443359375, -1.64825439453125, -1.596954345703125, -1.545654296875, -1.494354248046875, -1.44305419921875, -1.391754150390625, -1.3404541015625, -1.289154052734375, -1.23785400390625, -1.186553955078125, -1.13525390625, -1.083953857421875, -1.03265380859375, -0.981353759765625, -0.9300537109375, -0.878753662109375, -0.82745361328125, -0.776153564453125, -0.724853515625, -0.673553466796875, -0.62225341796875, -0.570953369140625, -0.5196533203125, -0.468353271484375, -0.41705322265625, -0.365753173828125, -0.314453125, -0.263153076171875, -0.21185302734375, -0.160552978515625, -0.1092529296875, -0.057952880859375, -0.00665283203125, 0.044647216796875, 0.095947265625, 0.147247314453125, 0.19854736328125, 0.249847412109375, 0.3011474609375, 0.352447509765625, 0.40374755859375, 0.455047607421875, 0.50634765625, 0.557647705078125, 0.60894775390625, 0.660247802734375, 0.7115478515625, 0.762847900390625, 0.81414794921875, 0.865447998046875, 0.916748046875, 0.968048095703125, 1.01934814453125, 1.070648193359375, 1.1219482421875, 1.173248291015625, 1.22454833984375, 1.275848388671875, 1.3271484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 10.0, 10.0, 11.0, 40.0, 55.0, 97.0, 101.0, 137.0, 149.0, 135.0, 103.0, 65.0, 38.0, 22.0, 19.0, 7.0, 6.0, 0.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.758206367492676, -9.556876182556152, -9.355545997619629, -9.154215812683105, -8.952885627746582, -8.751554489135742, -8.550224304199219, -8.348894119262695, -8.147563934326172, -7.946233749389648, -7.744903564453125, -7.543572902679443, -7.34224271774292, -7.1409125328063965, -6.939582347869873, -6.738251686096191, -6.536921501159668, -6.3355913162231445, -6.134261131286621, -5.9329304695129395, -5.731600284576416, -5.530270099639893, -5.328939914703369, -5.1276092529296875, -4.926279544830322, -4.724949359893799, -4.523619174957275, -4.322288513183594, -4.12095832824707, -3.919628143310547, -3.7182979583740234, -3.516967535018921, -3.3156373500823975, -3.114307165145874, -2.9129767417907715, -2.711646556854248, -2.5103161334991455, -2.308985948562622, -2.1076555252075195, -1.906325340270996, -1.704995036125183, -1.5036647319793701, -1.3023344278335571, -1.1010041236877441, -0.8996738791465759, -0.6983436346054077, -0.4970133304595947, -0.29568302631378174, -0.09435272216796875, 0.10697756707668304, 0.30830785632133484, 0.5096381306648254, 0.7109684348106384, 0.9122986793518066, 1.1136289834976196, 1.3149592876434326, 1.5162895917892456, 1.7176198959350586, 1.9189502000808716, 2.1202805042266846, 2.321610689163208, 2.5229411125183105, 2.724271297454834, 2.9256014823913574, 3.12693190574646]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 14.0, 14.0, 12.0, 12.0, 18.0, 25.0, 17.0, 24.0, 27.0, 34.0, 37.0, 34.0, 34.0, 30.0, 48.0, 34.0, 45.0, 46.0, 36.0, 51.0, 36.0, 42.0, 40.0, 29.0, 23.0, 38.0, 25.0, 18.0, 28.0, 18.0, 12.0, 11.0, 18.0, 15.0, 6.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.59322190284729, -2.51908278465271, -2.444943904876709, -2.370804786682129, -2.296665906906128, -2.222526788711548, -2.148387908935547, -2.074248790740967, -2.000109910964966, -1.9259709119796753, -1.8518319129943848, -1.7776929140090942, -1.7035539150238037, -1.6294149160385132, -1.5552759170532227, -1.4811367988586426, -1.406997799873352, -1.3328588008880615, -1.258719801902771, -1.1845808029174805, -1.11044180393219, -1.0363028049468994, -0.9621637463569641, -0.8880247473716736, -0.8138857483863831, -0.7397467494010925, -0.665607750415802, -0.5914686918258667, -0.5173296928405762, -0.44319072365760803, -0.3690516948699951, -0.2949126958847046, -0.22077369689941406, -0.14663469791412354, -0.07249568402767181, 0.0016433298587799072, 0.07578232884407043, 0.14992132782936096, 0.22406035661697388, 0.2981993556022644, 0.37233835458755493, 0.44647735357284546, 0.520616352558136, 0.5947554111480713, 0.6688944101333618, 0.7430334091186523, 0.8171724081039429, 0.8913114070892334, 0.9654504060745239, 1.0395894050598145, 1.113728404045105, 1.1878674030303955, 1.262006402015686, 1.3361454010009766, 1.4102845191955566, 1.4844233989715576, 1.5585625171661377, 1.6327015161514282, 1.7068405151367188, 1.7809795141220093, 1.8551185131072998, 1.9292575120925903, 2.003396511077881, 2.077535629272461, 2.151674509048462]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 8.0, 5.0, 6.0, 15.0, 26.0, 34.0, 45.0, 89.0, 166.0, 298.0, 642.0, 1639.0, 5305.0, 23226.0, 171338.0, 726884.0, 97122.0, 15354.0, 3911.0, 1291.0, 521.0, 275.0, 131.0, 89.0, 45.0, 32.0, 25.0, 15.0, 8.0, 7.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8312759399414062, -0.7997589111328125, -0.7682418823242188, -0.736724853515625, -0.7052078247070312, -0.6736907958984375, -0.6421737670898438, -0.61065673828125, -0.5791397094726562, -0.5476226806640625, -0.5161056518554688, -0.484588623046875, -0.45307159423828125, -0.4215545654296875, -0.39003753662109375, -0.3585205078125, -0.32700347900390625, -0.2954864501953125, -0.26396942138671875, -0.232452392578125, -0.20093536376953125, -0.1694183349609375, -0.13790130615234375, -0.10638427734375, -0.07486724853515625, -0.0433502197265625, -0.01183319091796875, 0.019683837890625, 0.05120086669921875, 0.0827178955078125, 0.11423492431640625, 0.145751953125, 0.17726898193359375, 0.2087860107421875, 0.24030303955078125, 0.271820068359375, 0.30333709716796875, 0.3348541259765625, 0.36637115478515625, 0.39788818359375, 0.42940521240234375, 0.4609222412109375, 0.49243927001953125, 0.523956298828125, 0.5554733276367188, 0.5869903564453125, 0.6185073852539062, 0.6500244140625, 0.6815414428710938, 0.7130584716796875, 0.7445755004882812, 0.776092529296875, 0.8076095581054688, 0.8391265869140625, 0.8706436157226562, 0.90216064453125, 0.9336776733398438, 0.9651947021484375, 0.9967117309570312, 1.028228759765625, 1.0597457885742188, 1.0912628173828125, 1.1227798461914062, 1.154296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 10.0, 12.0, 9.0, 17.0, 24.0, 25.0, 38.0, 41.0, 57.0, 52.0, 58.0, 63.0, 66.0, 67.0, 57.0, 66.0, 58.0, 56.0, 44.0, 50.0, 30.0, 24.0, 31.0, 20.0, 14.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5547637939453125, -1.485504150390625, -1.4162445068359375, -1.34698486328125, -1.2777252197265625, -1.208465576171875, -1.1392059326171875, -1.0699462890625, -1.0006866455078125, -0.931427001953125, -0.8621673583984375, -0.79290771484375, -0.7236480712890625, -0.654388427734375, -0.5851287841796875, -0.515869140625, -0.4466094970703125, -0.377349853515625, -0.3080902099609375, -0.23883056640625, -0.1695709228515625, -0.100311279296875, -0.0310516357421875, 0.0382080078125, 0.1074676513671875, 0.176727294921875, 0.2459869384765625, 0.31524658203125, 0.3845062255859375, 0.453765869140625, 0.5230255126953125, 0.59228515625, 0.6615447998046875, 0.730804443359375, 0.8000640869140625, 0.86932373046875, 0.9385833740234375, 1.007843017578125, 1.0771026611328125, 1.1463623046875, 1.2156219482421875, 1.284881591796875, 1.3541412353515625, 1.42340087890625, 1.4926605224609375, 1.561920166015625, 1.6311798095703125, 1.700439453125, 1.7696990966796875, 1.838958740234375, 1.9082183837890625, 1.97747802734375, 2.0467376708984375, 2.115997314453125, 2.1852569580078125, 2.2545166015625, 2.3237762451171875, 2.393035888671875, 2.4622955322265625, 2.53155517578125, 2.6008148193359375, 2.670074462890625, 2.7393341064453125, 2.80859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 6.0, 5.0, 12.0, 18.0, 28.0, 43.0, 49.0, 71.0, 120.0, 160.0, 255.0, 371.0, 617.0, 969.0, 1562.0, 2654.0, 4455.0, 7602.0, 13430.0, 24891.0, 48346.0, 105628.0, 260796.0, 318582.0, 133145.0, 58588.0, 28957.0, 15459.0, 8743.0, 5159.0, 2916.0, 1767.0, 1149.0, 680.0, 431.0, 291.0, 188.0, 103.0, 82.0, 68.0, 41.0, 36.0, 24.0, 14.0, 12.0, 5.0, 1.0, 7.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.187255859375, -0.18104171752929688, -0.17482757568359375, -0.16861343383789062, -0.1623992919921875, -0.15618515014648438, -0.14997100830078125, -0.14375686645507812, -0.137542724609375, -0.13132858276367188, -0.12511444091796875, -0.11890029907226562, -0.1126861572265625, -0.10647201538085938, -0.10025787353515625, -0.09404373168945312, -0.08782958984375, -0.08161544799804688, -0.07540130615234375, -0.06918716430664062, -0.0629730224609375, -0.056758880615234375, -0.05054473876953125, -0.044330596923828125, -0.038116455078125, -0.031902313232421875, -0.02568817138671875, -0.019474029541015625, -0.0132598876953125, -0.007045745849609375, -0.00083160400390625, 0.005382537841796875, 0.0115966796875, 0.017810821533203125, 0.02402496337890625, 0.030239105224609375, 0.0364532470703125, 0.042667388916015625, 0.04888153076171875, 0.055095672607421875, 0.061309814453125, 0.06752395629882812, 0.07373809814453125, 0.07995223999023438, 0.0861663818359375, 0.09238052368164062, 0.09859466552734375, 0.10480880737304688, 0.11102294921875, 0.11723709106445312, 0.12345123291015625, 0.12966537475585938, 0.1358795166015625, 0.14209365844726562, 0.14830780029296875, 0.15452194213867188, 0.160736083984375, 0.16695022583007812, 0.17316436767578125, 0.17937850952148438, 0.1855926513671875, 0.19180679321289062, 0.19802093505859375, 0.20423507690429688, 0.21044921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 18.0, 10.0, 13.0, 15.0, 18.0, 20.0, 27.0, 24.0, 37.0, 34.0, 49.0, 45.0, 56.0, 59.0, 54.0, 53.0, 45.0, 41.0, 46.0, 35.0, 40.0, 41.0, 22.0, 23.0, 17.0, 14.0, 19.0, 25.0, 18.0, 12.0, 9.0, 6.0, 6.0, 7.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.427734375, -3.326934814453125, -3.22613525390625, -3.125335693359375, -3.0245361328125, -2.923736572265625, -2.82293701171875, -2.722137451171875, -2.621337890625, -2.520538330078125, -2.41973876953125, -2.318939208984375, -2.2181396484375, -2.117340087890625, -2.01654052734375, -1.915740966796875, -1.81494140625, -1.714141845703125, -1.61334228515625, -1.512542724609375, -1.4117431640625, -1.310943603515625, -1.21014404296875, -1.109344482421875, -1.008544921875, -0.907745361328125, -0.80694580078125, -0.706146240234375, -0.6053466796875, -0.504547119140625, -0.40374755859375, -0.302947998046875, -0.2021484375, -0.101348876953125, -0.00054931640625, 0.100250244140625, 0.2010498046875, 0.301849365234375, 0.40264892578125, 0.503448486328125, 0.604248046875, 0.705047607421875, 0.80584716796875, 0.906646728515625, 1.0074462890625, 1.108245849609375, 1.20904541015625, 1.309844970703125, 1.41064453125, 1.511444091796875, 1.61224365234375, 1.713043212890625, 1.8138427734375, 1.914642333984375, 2.01544189453125, 2.116241455078125, 2.217041015625, 2.317840576171875, 2.41864013671875, 2.519439697265625, 2.6202392578125, 2.721038818359375, 2.82183837890625, 2.922637939453125, 3.0234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 7.0, 12.0, 17.0, 31.0, 60.0, 65.0, 119.0, 193.0, 375.0, 891.0, 3486.0, 22819.0, 574789.0, 420978.0, 20051.0, 3079.0, 783.0, 329.0, 162.0, 102.0, 71.0, 50.0, 27.0, 14.0, 15.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1370849609375, -0.1331644058227539, -0.1292438507080078, -0.12532329559326172, -0.12140274047851562, -0.11748218536376953, -0.11356163024902344, -0.10964107513427734, -0.10572052001953125, -0.10179996490478516, -0.09787940979003906, -0.09395885467529297, -0.09003829956054688, -0.08611774444580078, -0.08219718933105469, -0.0782766342163086, -0.0743560791015625, -0.0704355239868164, -0.06651496887207031, -0.06259441375732422, -0.058673858642578125, -0.05475330352783203, -0.05083274841308594, -0.046912193298339844, -0.04299163818359375, -0.039071083068847656, -0.03515052795410156, -0.03122997283935547, -0.027309417724609375, -0.02338886260986328, -0.019468307495117188, -0.015547752380371094, -0.011627197265625, -0.007706642150878906, -0.0037860870361328125, 0.00013446807861328125, 0.004055023193359375, 0.007975578308105469, 0.011896133422851562, 0.015816688537597656, 0.01973724365234375, 0.023657798767089844, 0.027578353881835938, 0.03149890899658203, 0.035419464111328125, 0.03934001922607422, 0.04326057434082031, 0.047181129455566406, 0.0511016845703125, 0.055022239685058594, 0.05894279479980469, 0.06286334991455078, 0.06678390502929688, 0.07070446014404297, 0.07462501525878906, 0.07854557037353516, 0.08246612548828125, 0.08638668060302734, 0.09030723571777344, 0.09422779083251953, 0.09814834594726562, 0.10206890106201172, 0.10598945617675781, 0.1099100112915039, 0.11383056640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 2.0, 3.0, 6.0, 9.0, 15.0, 33.0, 29.0, 51.0, 61.0, 84.0, 121.0, 118.0, 113.0, 116.0, 64.0, 57.0, 41.0, 32.0, 13.0, 12.0, 9.0, 1.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1425228118896484e-05, -3.9662234485149384e-05, -3.789924085140228e-05, -3.613624721765518e-05, -3.437325358390808e-05, -3.261025995016098e-05, -3.084726631641388e-05, -2.908427268266678e-05, -2.7321279048919678e-05, -2.5558285415172577e-05, -2.3795291781425476e-05, -2.2032298147678375e-05, -2.0269304513931274e-05, -1.8506310880184174e-05, -1.6743317246437073e-05, -1.4980323612689972e-05, -1.3217329978942871e-05, -1.145433634519577e-05, -9.69134271144867e-06, -7.928349077701569e-06, -6.165355443954468e-06, -4.402361810207367e-06, -2.639368176460266e-06, -8.763745427131653e-07, 8.866190910339355e-07, 2.6496127247810364e-06, 4.412606358528137e-06, 6.175599992275238e-06, 7.938593626022339e-06, 9.70158725976944e-06, 1.146458089351654e-05, 1.3227574527263641e-05, 1.4990568161010742e-05, 1.6753561794757843e-05, 1.8516555428504944e-05, 2.0279549062252045e-05, 2.2042542695999146e-05, 2.3805536329746246e-05, 2.5568529963493347e-05, 2.7331523597240448e-05, 2.909451723098755e-05, 3.085751086473465e-05, 3.262050449848175e-05, 3.438349813222885e-05, 3.614649176597595e-05, 3.790948539972305e-05, 3.9672479033470154e-05, 4.1435472667217255e-05, 4.3198466300964355e-05, 4.4961459934711456e-05, 4.672445356845856e-05, 4.848744720220566e-05, 5.025044083595276e-05, 5.201343446969986e-05, 5.377642810344696e-05, 5.553942173719406e-05, 5.730241537094116e-05, 5.906540900468826e-05, 6.0828402638435364e-05, 6.259139627218246e-05, 6.435438990592957e-05, 6.611738353967667e-05, 6.788037717342377e-05, 6.964337080717087e-05, 7.140636444091797e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 11.0, 15.0, 37.0, 63.0, 117.0, 255.0, 580.0, 1667.0, 5355.0, 27869.0, 645080.0, 339502.0, 21204.0, 4391.0, 1408.0, 542.0, 221.0, 96.0, 59.0, 22.0, 20.0, 11.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1578369140625, -0.1531848907470703, -0.14853286743164062, -0.14388084411621094, -0.13922882080078125, -0.13457679748535156, -0.12992477416992188, -0.1252727508544922, -0.1206207275390625, -0.11596870422363281, -0.11131668090820312, -0.10666465759277344, -0.10201263427734375, -0.09736061096191406, -0.09270858764648438, -0.08805656433105469, -0.083404541015625, -0.07875251770019531, -0.07410049438476562, -0.06944847106933594, -0.06479644775390625, -0.06014442443847656, -0.055492401123046875, -0.05084037780761719, -0.0461883544921875, -0.04153633117675781, -0.036884307861328125, -0.03223228454589844, -0.02758026123046875, -0.022928237915039062, -0.018276214599609375, -0.013624191284179688, -0.00897216796875, -0.0043201446533203125, 0.000331878662109375, 0.0049839019775390625, 0.00963592529296875, 0.014287948608398438, 0.018939971923828125, 0.023591995239257812, 0.0282440185546875, 0.03289604187011719, 0.037548065185546875, 0.04220008850097656, 0.04685211181640625, 0.05150413513183594, 0.056156158447265625, 0.06080818176269531, 0.065460205078125, 0.07011222839355469, 0.07476425170898438, 0.07941627502441406, 0.08406829833984375, 0.08872032165527344, 0.09337234497070312, 0.09802436828613281, 0.1026763916015625, 0.10732841491699219, 0.11198043823242188, 0.11663246154785156, 0.12128448486328125, 0.12593650817871094, 0.13058853149414062, 0.1352405548095703, 0.139892578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 9.0, 10.0, 10.0, 24.0, 41.0, 115.0, 326.0, 258.0, 81.0, 41.0, 26.0, 14.0, 11.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.03790283203125, -0.03695273399353027, -0.03600263595581055, -0.03505253791809082, -0.034102439880371094, -0.03315234184265137, -0.03220224380493164, -0.031252145767211914, -0.030302047729492188, -0.02935194969177246, -0.028401851654052734, -0.027451753616333008, -0.02650165557861328, -0.025551557540893555, -0.024601459503173828, -0.0236513614654541, -0.022701263427734375, -0.02175116539001465, -0.020801067352294922, -0.019850969314575195, -0.01890087127685547, -0.017950773239135742, -0.017000675201416016, -0.01605057716369629, -0.015100479125976562, -0.014150381088256836, -0.01320028305053711, -0.012250185012817383, -0.011300086975097656, -0.01034998893737793, -0.009399890899658203, -0.008449792861938477, -0.00749969482421875, -0.0065495967864990234, -0.005599498748779297, -0.00464940071105957, -0.0036993026733398438, -0.002749204635620117, -0.0017991065979003906, -0.0008490085601806641, 0.0001010894775390625, 0.001051187515258789, 0.0020012855529785156, 0.002951383590698242, 0.0039014816284179688, 0.004851579666137695, 0.005801677703857422, 0.0067517757415771484, 0.007701873779296875, 0.008651971817016602, 0.009602069854736328, 0.010552167892456055, 0.011502265930175781, 0.012452363967895508, 0.013402462005615234, 0.014352560043334961, 0.015302658081054688, 0.016252756118774414, 0.01720285415649414, 0.018152952194213867, 0.019103050231933594, 0.02005314826965332, 0.021003246307373047, 0.021953344345092773, 0.0229034423828125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 14.0, 20.0, 36.0, 52.0, 78.0, 103.0, 121.0, 134.0, 130.0, 96.0, 73.0, 61.0, 33.0, 13.0, 14.0, 10.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1637420654296875, -4.063394069671631, -3.9630463123321533, -3.862698554992676, -3.762350559234619, -3.6620028018951416, -3.561655044555664, -3.4613070487976074, -3.360959053039551, -3.2606112957000732, -3.1602632999420166, -3.059915542602539, -2.9595675468444824, -2.859219789505005, -2.7588720321655273, -2.6585240364074707, -2.558176279067993, -2.4578285217285156, -2.357480525970459, -2.2571327686309814, -2.156784772872925, -2.0564370155334473, -1.9560891389846802, -1.855741262435913, -1.755393385887146, -1.655045509338379, -1.5546976327896118, -1.4543497562408447, -1.3540019989013672, -1.2536540031433105, -1.153306245803833, -1.052958369255066, -0.9526102542877197, -0.8522623777389526, -0.7519145011901855, -0.6515666842460632, -0.5512188076972961, -0.45087093114852905, -0.35052311420440674, -0.25017523765563965, -0.14982736110687256, -0.04947949945926666, 0.05086836218833923, 0.15121620893478394, 0.251564085483551, 0.3519119620323181, 0.45225977897644043, 0.5526076555252075, 0.6529555320739746, 0.7533034086227417, 0.8536512851715088, 0.9539991021156311, 1.054347038269043, 1.1546947956085205, 1.2550426721572876, 1.3553905487060547, 1.4557384252548218, 1.5560863018035889, 1.656434178352356, 1.756782054901123, 1.8571298122406006, 1.9574778079986572, 2.0578255653381348, 2.1581735610961914, 2.258521318435669]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 12.0, 11.0, 19.0, 12.0, 26.0, 21.0, 24.0, 27.0, 39.0, 37.0, 37.0, 44.0, 40.0, 48.0, 51.0, 46.0, 50.0, 53.0, 47.0, 53.0, 35.0, 34.0, 38.0, 30.0, 25.0, 24.0, 25.0, 12.0, 16.0, 15.0, 12.0, 10.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.6357100009918213, -1.5870754718780518, -1.5384409427642822, -1.4898064136505127, -1.4411718845367432, -1.3925373554229736, -1.343902826309204, -1.2952682971954346, -1.246633768081665, -1.1979992389678955, -1.149364709854126, -1.1007301807403564, -1.052095651626587, -1.0034611225128174, -0.9548265933990479, -0.9061920642852783, -0.8575575351715088, -0.8089230060577393, -0.7602884769439697, -0.7116539478302002, -0.6630194187164307, -0.6143848896026611, -0.5657503604888916, -0.5171158313751221, -0.46848130226135254, -0.419846773147583, -0.3712122440338135, -0.32257771492004395, -0.2739431858062744, -0.22530865669250488, -0.17667412757873535, -0.12803959846496582, -0.07940518856048584, -0.03077065944671631, 0.017863869667053223, 0.06649839878082275, 0.11513292789459229, 0.16376745700836182, 0.21240198612213135, 0.2610365152359009, 0.3096710443496704, 0.35830557346343994, 0.4069401025772095, 0.455574631690979, 0.5042091608047485, 0.5528436899185181, 0.6014782190322876, 0.6501127481460571, 0.6987472772598267, 0.7473818063735962, 0.7960163354873657, 0.8446508646011353, 0.8932853937149048, 0.9419199228286743, 0.9905544519424438, 1.0391889810562134, 1.087823510169983, 1.1364580392837524, 1.185092568397522, 1.2337270975112915, 1.282361626625061, 1.3309961557388306, 1.3796306848526, 1.4282652139663696, 1.4768997430801392]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 10.0, 21.0, 25.0, 30.0, 50.0, 100.0, 177.0, 402.0, 875.0, 2080.0, 5508.0, 17627.0, 62799.0, 285379.0, 505220.0, 122474.0, 30921.0, 9306.0, 3132.0, 1237.0, 531.0, 269.0, 132.0, 93.0, 46.0, 34.0, 29.0, 10.0, 6.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.419921875, -2.342437744140625, -2.26495361328125, -2.187469482421875, -2.1099853515625, -2.032501220703125, -1.95501708984375, -1.877532958984375, -1.800048828125, -1.722564697265625, -1.64508056640625, -1.567596435546875, -1.4901123046875, -1.412628173828125, -1.33514404296875, -1.257659912109375, -1.18017578125, -1.102691650390625, -1.02520751953125, -0.947723388671875, -0.8702392578125, -0.792755126953125, -0.71527099609375, -0.637786865234375, -0.560302734375, -0.482818603515625, -0.40533447265625, -0.327850341796875, -0.2503662109375, -0.172882080078125, -0.09539794921875, -0.017913818359375, 0.0595703125, 0.137054443359375, 0.21453857421875, 0.292022705078125, 0.3695068359375, 0.446990966796875, 0.52447509765625, 0.601959228515625, 0.679443359375, 0.756927490234375, 0.83441162109375, 0.911895751953125, 0.9893798828125, 1.066864013671875, 1.14434814453125, 1.221832275390625, 1.29931640625, 1.376800537109375, 1.45428466796875, 1.531768798828125, 1.6092529296875, 1.686737060546875, 1.76422119140625, 1.841705322265625, 1.919189453125, 1.996673583984375, 2.07415771484375, 2.151641845703125, 2.2291259765625, 2.306610107421875, 2.38409423828125, 2.461578369140625, 2.5390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 12.0, 15.0, 22.0, 16.0, 40.0, 29.0, 40.0, 44.0, 44.0, 55.0, 57.0, 65.0, 56.0, 89.0, 55.0, 64.0, 64.0, 39.0, 32.0, 43.0, 24.0, 24.0, 20.0, 18.0, 13.0, 9.0, 6.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.4453125, -6.294158935546875, -6.14300537109375, -5.991851806640625, -5.8406982421875, -5.689544677734375, -5.53839111328125, -5.387237548828125, -5.236083984375, -5.084930419921875, -4.93377685546875, -4.782623291015625, -4.6314697265625, -4.480316162109375, -4.32916259765625, -4.178009033203125, -4.02685546875, -3.875701904296875, -3.72454833984375, -3.573394775390625, -3.4222412109375, -3.271087646484375, -3.11993408203125, -2.968780517578125, -2.817626953125, -2.666473388671875, -2.51531982421875, -2.364166259765625, -2.2130126953125, -2.061859130859375, -1.91070556640625, -1.759552001953125, -1.6083984375, -1.457244873046875, -1.30609130859375, -1.154937744140625, -1.0037841796875, -0.852630615234375, -0.70147705078125, -0.550323486328125, -0.399169921875, -0.248016357421875, -0.09686279296875, 0.054290771484375, 0.2054443359375, 0.356597900390625, 0.50775146484375, 0.658905029296875, 0.81005859375, 0.961212158203125, 1.11236572265625, 1.263519287109375, 1.4146728515625, 1.565826416015625, 1.71697998046875, 1.868133544921875, 2.019287109375, 2.170440673828125, 2.32159423828125, 2.472747802734375, 2.6239013671875, 2.775054931640625, 2.92620849609375, 3.077362060546875, 3.228515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 19.0, 16.0, 17.0, 34.0, 46.0, 60.0, 81.0, 125.0, 207.0, 494.0, 1500.0, 6261.0, 36205.0, 327484.0, 597034.0, 65173.0, 10281.0, 2109.0, 630.0, 248.0, 166.0, 99.0, 58.0, 59.0, 36.0, 21.0, 18.0, 20.0, 7.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.32421875, -3.20611572265625, -3.0880126953125, -2.96990966796875, -2.851806640625, -2.73370361328125, -2.6156005859375, -2.49749755859375, -2.37939453125, -2.26129150390625, -2.1431884765625, -2.02508544921875, -1.906982421875, -1.78887939453125, -1.6707763671875, -1.55267333984375, -1.4345703125, -1.31646728515625, -1.1983642578125, -1.08026123046875, -0.962158203125, -0.84405517578125, -0.7259521484375, -0.60784912109375, -0.48974609375, -0.37164306640625, -0.2535400390625, -0.13543701171875, -0.017333984375, 0.10076904296875, 0.2188720703125, 0.33697509765625, 0.455078125, 0.57318115234375, 0.6912841796875, 0.80938720703125, 0.927490234375, 1.04559326171875, 1.1636962890625, 1.28179931640625, 1.39990234375, 1.51800537109375, 1.6361083984375, 1.75421142578125, 1.872314453125, 1.99041748046875, 2.1085205078125, 2.22662353515625, 2.3447265625, 2.46282958984375, 2.5809326171875, 2.69903564453125, 2.817138671875, 2.93524169921875, 3.0533447265625, 3.17144775390625, 3.28955078125, 3.40765380859375, 3.5257568359375, 3.64385986328125, 3.761962890625, 3.88006591796875, 3.9981689453125, 4.11627197265625, 4.234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 15.0, 12.0, 25.0, 19.0, 32.0, 24.0, 33.0, 63.0, 59.0, 63.0, 71.0, 54.0, 79.0, 63.0, 65.0, 58.0, 38.0, 55.0, 32.0, 25.0, 27.0, 22.0, 15.0, 10.0, 10.0, 7.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.3355712890625, -5.159423828125, -4.9832763671875, -4.80712890625, -4.6309814453125, -4.454833984375, -4.2786865234375, -4.1025390625, -3.9263916015625, -3.750244140625, -3.5740966796875, -3.39794921875, -3.2218017578125, -3.045654296875, -2.8695068359375, -2.693359375, -2.5172119140625, -2.341064453125, -2.1649169921875, -1.98876953125, -1.8126220703125, -1.636474609375, -1.4603271484375, -1.2841796875, -1.1080322265625, -0.931884765625, -0.7557373046875, -0.57958984375, -0.4034423828125, -0.227294921875, -0.0511474609375, 0.125, 0.3011474609375, 0.477294921875, 0.6534423828125, 0.82958984375, 1.0057373046875, 1.181884765625, 1.3580322265625, 1.5341796875, 1.7103271484375, 1.886474609375, 2.0626220703125, 2.23876953125, 2.4149169921875, 2.591064453125, 2.7672119140625, 2.943359375, 3.1195068359375, 3.295654296875, 3.4718017578125, 3.64794921875, 3.8240966796875, 4.000244140625, 4.1763916015625, 4.3525390625, 4.5286865234375, 4.704833984375, 4.8809814453125, 5.05712890625, 5.2332763671875, 5.409423828125, 5.5855712890625, 5.76171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 2.0, 6.0, 9.0, 14.0, 12.0, 24.0, 34.0, 56.0, 104.0, 169.0, 411.0, 1029.0, 3528.0, 17038.0, 152775.0, 751230.0, 104449.0, 13117.0, 2883.0, 884.0, 352.0, 155.0, 94.0, 46.0, 32.0, 32.0, 16.0, 9.0, 7.0, 5.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0, -0.971771240234375, -0.94354248046875, -0.915313720703125, -0.8870849609375, -0.858856201171875, -0.83062744140625, -0.802398681640625, -0.774169921875, -0.745941162109375, -0.71771240234375, -0.689483642578125, -0.6612548828125, -0.633026123046875, -0.60479736328125, -0.576568603515625, -0.54833984375, -0.520111083984375, -0.49188232421875, -0.463653564453125, -0.4354248046875, -0.407196044921875, -0.37896728515625, -0.350738525390625, -0.322509765625, -0.294281005859375, -0.26605224609375, -0.237823486328125, -0.2095947265625, -0.181365966796875, -0.15313720703125, -0.124908447265625, -0.0966796875, -0.068450927734375, -0.04022216796875, -0.011993408203125, 0.0162353515625, 0.044464111328125, 0.07269287109375, 0.100921630859375, 0.129150390625, 0.157379150390625, 0.18560791015625, 0.213836669921875, 0.2420654296875, 0.270294189453125, 0.29852294921875, 0.326751708984375, 0.35498046875, 0.383209228515625, 0.41143798828125, 0.439666748046875, 0.4678955078125, 0.496124267578125, 0.52435302734375, 0.552581787109375, 0.580810546875, 0.609039306640625, 0.63726806640625, 0.665496826171875, 0.6937255859375, 0.721954345703125, 0.75018310546875, 0.778411865234375, 0.806640625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 6.0, 12.0, 15.0, 24.0, 34.0, 41.0, 52.0, 80.0, 91.0, 109.0, 146.0, 107.0, 68.0, 51.0, 44.0, 29.0, 23.0, 13.0, 11.0, 12.0, 7.0, 9.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010287761688232422, -9.935349225997925e-05, -9.582936763763428e-05, -9.23052430152893e-05, -8.878111839294434e-05, -8.525699377059937e-05, -8.17328691482544e-05, -7.820874452590942e-05, -7.468461990356445e-05, -7.116049528121948e-05, -6.763637065887451e-05, -6.411224603652954e-05, -6.058812141418457e-05, -5.70639967918396e-05, -5.353987216949463e-05, -5.001574754714966e-05, -4.649162292480469e-05, -4.296749830245972e-05, -3.9443373680114746e-05, -3.5919249057769775e-05, -3.2395124435424805e-05, -2.8870999813079834e-05, -2.5346875190734863e-05, -2.1822750568389893e-05, -1.8298625946044922e-05, -1.4774501323699951e-05, -1.125037670135498e-05, -7.72625207901001e-06, -4.202127456665039e-06, -6.780028343200684e-07, 2.8461217880249023e-06, 6.370246410369873e-06, 9.894371032714844e-06, 1.3418495655059814e-05, 1.6942620277404785e-05, 2.0466744899749756e-05, 2.3990869522094727e-05, 2.7514994144439697e-05, 3.103911876678467e-05, 3.456324338912964e-05, 3.808736801147461e-05, 4.161149263381958e-05, 4.513561725616455e-05, 4.865974187850952e-05, 5.218386650085449e-05, 5.570799112319946e-05, 5.9232115745544434e-05, 6.27562403678894e-05, 6.628036499023438e-05, 6.980448961257935e-05, 7.332861423492432e-05, 7.685273885726929e-05, 8.037686347961426e-05, 8.390098810195923e-05, 8.74251127243042e-05, 9.094923734664917e-05, 9.447336196899414e-05, 9.799748659133911e-05, 0.00010152161121368408, 0.00010504573583602905, 0.00010856986045837402, 0.000112093985080719, 0.00011561810970306396, 0.00011914223432540894, 0.0001226663589477539]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 0.0, 2.0, 7.0, 17.0, 19.0, 26.0, 61.0, 92.0, 152.0, 249.0, 446.0, 810.0, 1668.0, 3966.0, 13729.0, 91686.0, 734591.0, 171248.0, 20375.0, 5220.0, 1964.0, 944.0, 504.0, 300.0, 178.0, 121.0, 72.0, 39.0, 31.0, 10.0, 11.0, 10.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1591796875, -1.125701904296875, -1.09222412109375, -1.058746337890625, -1.0252685546875, -0.991790771484375, -0.95831298828125, -0.924835205078125, -0.891357421875, -0.857879638671875, -0.82440185546875, -0.790924072265625, -0.7574462890625, -0.723968505859375, -0.69049072265625, -0.657012939453125, -0.62353515625, -0.590057373046875, -0.55657958984375, -0.523101806640625, -0.4896240234375, -0.456146240234375, -0.42266845703125, -0.389190673828125, -0.355712890625, -0.322235107421875, -0.28875732421875, -0.255279541015625, -0.2218017578125, -0.188323974609375, -0.15484619140625, -0.121368408203125, -0.087890625, -0.054412841796875, -0.02093505859375, 0.012542724609375, 0.0460205078125, 0.079498291015625, 0.11297607421875, 0.146453857421875, 0.179931640625, 0.213409423828125, 0.24688720703125, 0.280364990234375, 0.3138427734375, 0.347320556640625, 0.38079833984375, 0.414276123046875, 0.44775390625, 0.481231689453125, 0.51470947265625, 0.548187255859375, 0.5816650390625, 0.615142822265625, 0.64862060546875, 0.682098388671875, 0.715576171875, 0.749053955078125, 0.78253173828125, 0.816009521484375, 0.8494873046875, 0.882965087890625, 0.91644287109375, 0.949920654296875, 0.9833984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 16.0, 20.0, 24.0, 35.0, 67.0, 79.0, 113.0, 175.0, 144.0, 90.0, 80.0, 70.0, 26.0, 19.0, 16.0, 8.0, 7.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5036087036132812, -0.4867095947265625, -0.46981048583984375, -0.452911376953125, -0.43601226806640625, -0.4191131591796875, -0.40221405029296875, -0.38531494140625, -0.36841583251953125, -0.3515167236328125, -0.33461761474609375, -0.317718505859375, -0.30081939697265625, -0.2839202880859375, -0.26702117919921875, -0.2501220703125, -0.23322296142578125, -0.2163238525390625, -0.19942474365234375, -0.182525634765625, -0.16562652587890625, -0.1487274169921875, -0.13182830810546875, -0.11492919921875, -0.09803009033203125, -0.0811309814453125, -0.06423187255859375, -0.047332763671875, -0.03043365478515625, -0.0135345458984375, 0.00336456298828125, 0.020263671875, 0.03716278076171875, 0.0540618896484375, 0.07096099853515625, 0.087860107421875, 0.10475921630859375, 0.1216583251953125, 0.13855743408203125, 0.15545654296875, 0.17235565185546875, 0.1892547607421875, 0.20615386962890625, 0.223052978515625, 0.23995208740234375, 0.2568511962890625, 0.27375030517578125, 0.2906494140625, 0.30754852294921875, 0.3244476318359375, 0.34134674072265625, 0.358245849609375, 0.37514495849609375, 0.3920440673828125, 0.40894317626953125, 0.42584228515625, 0.44274139404296875, 0.4596405029296875, 0.47653961181640625, 0.493438720703125, 0.5103378295898438, 0.5272369384765625, 0.5441360473632812, 0.56103515625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 38.0, 106.0, 278.0, 310.0, 186.0, 51.0, 24.0, 8.0, 5.0, 1.0, 1.0], "bins": [-30.301959991455078, -29.763917922973633, -29.225875854492188, -28.687835693359375, -28.14979362487793, -27.611751556396484, -27.07370948791504, -26.535667419433594, -25.99762725830078, -25.459585189819336, -24.92154312133789, -24.383502960205078, -23.845460891723633, -23.307418823242188, -22.769376754760742, -22.231334686279297, -21.69329261779785, -21.155250549316406, -20.61720848083496, -20.07916831970215, -19.541126251220703, -19.003084182739258, -18.465042114257812, -17.927000045776367, -17.388957977294922, -16.850915908813477, -16.31287384033203, -15.774832725524902, -15.236791610717773, -14.698749542236328, -14.160707473754883, -13.622665405273438, -13.084625244140625, -12.54658317565918, -12.00854206085205, -11.470499992370605, -10.932458877563477, -10.394416809082031, -9.856374740600586, -9.31833267211914, -8.780291557312012, -8.242249488830566, -7.7042083740234375, -7.166166305541992, -6.628124713897705, -6.090083122253418, -5.552041053771973, -5.0139994621276855, -4.475957870483398, -3.9379162788391113, -3.399874448776245, -2.861832618713379, -2.323791027069092, -1.7857494354248047, -1.2477076053619385, -0.7096657752990723, -0.17162418365478516, 0.3664175271987915, 0.9044592380523682, 1.4425009489059448, 1.9805426597595215, 2.5185842514038086, 3.056626081466675, 3.594667911529541, 4.132709503173828]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 8.0, 9.0, 7.0, 5.0, 16.0, 17.0, 18.0, 19.0, 24.0, 31.0, 31.0, 33.0, 32.0, 32.0, 34.0, 41.0, 44.0, 40.0, 29.0, 34.0, 27.0, 34.0, 41.0, 43.0, 38.0, 28.0, 34.0, 30.0, 35.0, 22.0, 17.0, 17.0, 17.0, 22.0, 15.0, 7.0, 10.0, 4.0, 7.0, 7.0, 8.0, 4.0, 3.0, 0.0, 1.0, 4.0], "bins": [-6.742868900299072, -6.559817314147949, -6.376765727996826, -6.193714141845703, -6.01066255569458, -5.827610969543457, -5.644558906555176, -5.461507797241211, -5.27845573425293, -5.095404148101807, -4.912352561950684, -4.7293009757995605, -4.5462493896484375, -4.3631978034973145, -4.180146217346191, -3.9970943927764893, -3.8140430450439453, -3.6309914588928223, -3.447939872741699, -3.264888286590576, -3.081836700439453, -2.89878511428833, -2.715733289718628, -2.532681703567505, -2.349630117416382, -2.166578531265259, -1.9835269451141357, -1.8004752397537231, -1.6174236536026, -1.434372067451477, -1.2513203620910645, -1.0682687759399414, -0.8852167129516602, -0.7021651268005371, -0.5191134810447693, -0.33606183528900146, -0.15301024913787842, 0.03004133701324463, 0.21309304237365723, 0.3961446285247803, 0.5791962146759033, 0.7622478008270264, 0.9452994465827942, 1.128351092338562, 1.311402678489685, 1.494454264640808, 1.6775059700012207, 1.8605575561523438, 2.043609142303467, 2.22666072845459, 2.409712314605713, 2.592763900756836, 2.775815486907959, 2.958867073059082, 3.141918897628784, 3.3249704837799072, 3.5080220699310303, 3.6910736560821533, 3.8741252422332764, 4.0571770668029785, 4.240228652954102, 4.423280239105225, 4.606331825256348, 4.789383411407471, 4.972434997558594]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 5.0, 10.0, 9.0, 12.0, 17.0, 24.0, 35.0, 44.0, 66.0, 85.0, 182.0, 357.0, 869.0, 2715.0, 12493.0, 184248.0, 3791008.0, 184252.0, 13212.0, 2847.0, 948.0, 370.0, 168.0, 100.0, 63.0, 37.0, 35.0, 23.0, 13.0, 9.0, 9.0, 5.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.510498046875, -5.29443359375, -5.078369140625, -4.8623046875, -4.646240234375, -4.43017578125, -4.214111328125, -3.998046875, -3.781982421875, -3.56591796875, -3.349853515625, -3.1337890625, -2.917724609375, -2.70166015625, -2.485595703125, -2.26953125, -2.053466796875, -1.83740234375, -1.621337890625, -1.4052734375, -1.189208984375, -0.97314453125, -0.757080078125, -0.541015625, -0.324951171875, -0.10888671875, 0.107177734375, 0.3232421875, 0.539306640625, 0.75537109375, 0.971435546875, 1.1875, 1.403564453125, 1.61962890625, 1.835693359375, 2.0517578125, 2.267822265625, 2.48388671875, 2.699951171875, 2.916015625, 3.132080078125, 3.34814453125, 3.564208984375, 3.7802734375, 3.996337890625, 4.21240234375, 4.428466796875, 4.64453125, 4.860595703125, 5.07666015625, 5.292724609375, 5.5087890625, 5.724853515625, 5.94091796875, 6.156982421875, 6.373046875, 6.589111328125, 6.80517578125, 7.021240234375, 7.2373046875, 7.453369140625, 7.66943359375, 7.885498046875, 8.1015625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 7.0, 8.0, 17.0, 16.0, 25.0, 16.0, 38.0, 46.0, 44.0, 61.0, 73.0, 72.0, 73.0, 70.0, 79.0, 67.0, 45.0, 41.0, 47.0, 33.0, 30.0, 20.0, 29.0, 17.0, 9.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.244140625, -3.162841796875, -3.08154296875, -3.000244140625, -2.9189453125, -2.837646484375, -2.75634765625, -2.675048828125, -2.59375, -2.512451171875, -2.43115234375, -2.349853515625, -2.2685546875, -2.187255859375, -2.10595703125, -2.024658203125, -1.943359375, -1.862060546875, -1.78076171875, -1.699462890625, -1.6181640625, -1.536865234375, -1.45556640625, -1.374267578125, -1.29296875, -1.211669921875, -1.13037109375, -1.049072265625, -0.9677734375, -0.886474609375, -0.80517578125, -0.723876953125, -0.642578125, -0.561279296875, -0.47998046875, -0.398681640625, -0.3173828125, -0.236083984375, -0.15478515625, -0.073486328125, 0.0078125, 0.089111328125, 0.17041015625, 0.251708984375, 0.3330078125, 0.414306640625, 0.49560546875, 0.576904296875, 0.658203125, 0.739501953125, 0.82080078125, 0.902099609375, 0.9833984375, 1.064697265625, 1.14599609375, 1.227294921875, 1.30859375, 1.389892578125, 1.47119140625, 1.552490234375, 1.6337890625, 1.715087890625, 1.79638671875, 1.877685546875, 1.958984375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 22.0, 25.0, 53.0, 83.0, 186.0, 403.0, 983.0, 3750.0, 37607.0, 3871668.0, 267774.0, 8891.0, 1716.0, 575.0, 259.0, 116.0, 81.0, 36.0, 20.0, 12.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-10.875, -10.60125732421875, -10.3275146484375, -10.05377197265625, -9.780029296875, -9.50628662109375, -9.2325439453125, -8.95880126953125, -8.68505859375, -8.41131591796875, -8.1375732421875, -7.86383056640625, -7.590087890625, -7.31634521484375, -7.0426025390625, -6.76885986328125, -6.4951171875, -6.22137451171875, -5.9476318359375, -5.67388916015625, -5.400146484375, -5.12640380859375, -4.8526611328125, -4.57891845703125, -4.30517578125, -4.03143310546875, -3.7576904296875, -3.48394775390625, -3.210205078125, -2.93646240234375, -2.6627197265625, -2.38897705078125, -2.115234375, -1.84149169921875, -1.5677490234375, -1.29400634765625, -1.020263671875, -0.74652099609375, -0.4727783203125, -0.19903564453125, 0.07470703125, 0.34844970703125, 0.6221923828125, 0.89593505859375, 1.169677734375, 1.44342041015625, 1.7171630859375, 1.99090576171875, 2.2646484375, 2.53839111328125, 2.8121337890625, 3.08587646484375, 3.359619140625, 3.63336181640625, 3.9071044921875, 4.18084716796875, 4.45458984375, 4.72833251953125, 5.0020751953125, 5.27581787109375, 5.549560546875, 5.82330322265625, 6.0970458984375, 6.37078857421875, 6.64453125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 10.0, 18.0, 23.0, 46.0, 85.0, 147.0, 345.0, 821.0, 1138.0, 790.0, 319.0, 166.0, 75.0, 40.0, 18.0, 11.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5361328125, -1.4706878662109375, -1.405242919921875, -1.3397979736328125, -1.27435302734375, -1.2089080810546875, -1.143463134765625, -1.0780181884765625, -1.0125732421875, -0.9471282958984375, -0.881683349609375, -0.8162384033203125, -0.75079345703125, -0.6853485107421875, -0.619903564453125, -0.5544586181640625, -0.489013671875, -0.4235687255859375, -0.358123779296875, -0.2926788330078125, -0.22723388671875, -0.1617889404296875, -0.096343994140625, -0.0308990478515625, 0.0345458984375, 0.0999908447265625, 0.165435791015625, 0.2308807373046875, 0.29632568359375, 0.3617706298828125, 0.427215576171875, 0.4926605224609375, 0.55810546875, 0.6235504150390625, 0.688995361328125, 0.7544403076171875, 0.81988525390625, 0.8853302001953125, 0.950775146484375, 1.0162200927734375, 1.0816650390625, 1.1471099853515625, 1.212554931640625, 1.2779998779296875, 1.34344482421875, 1.4088897705078125, 1.474334716796875, 1.5397796630859375, 1.605224609375, 1.6706695556640625, 1.736114501953125, 1.8015594482421875, 1.86700439453125, 1.9324493408203125, 1.997894287109375, 2.0633392333984375, 2.1287841796875, 2.1942291259765625, 2.259674072265625, 2.3251190185546875, 2.39056396484375, 2.4560089111328125, 2.521453857421875, 2.5868988037109375, 2.65234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 8.0, 9.0, 11.0, 19.0, 7.0, 30.0, 26.0, 42.0, 42.0, 50.0, 52.0, 68.0, 70.0, 66.0, 72.0, 72.0, 63.0, 56.0, 53.0, 34.0, 34.0, 28.0, 18.0, 22.0, 17.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-4.512925148010254, -4.408871173858643, -4.304817199707031, -4.20076322555542, -4.096709251403809, -3.9926552772521973, -3.888601303100586, -3.7845473289489746, -3.6804933547973633, -3.576439380645752, -3.4723854064941406, -3.3683314323425293, -3.264277458190918, -3.1602234840393066, -3.0561695098876953, -2.952115535736084, -2.8480613231658936, -2.7440073490142822, -2.639953374862671, -2.5358994007110596, -2.4318454265594482, -2.327791452407837, -2.2237372398376465, -2.119683265686035, -2.015629291534424, -1.9115753173828125, -1.8075213432312012, -1.7034673690795898, -1.5994133949279785, -1.4953594207763672, -1.3913053274154663, -1.287251353263855, -1.1831974983215332, -1.0791435241699219, -0.9750895500183105, -0.8710355162620544, -0.7669815421104431, -0.6629275679588318, -0.5588735342025757, -0.45481956005096436, -0.350765585899353, -0.2467115968465805, -0.14265760779380798, -0.03860360383987427, 0.06545037031173706, 0.1695043444633484, 0.2735583782196045, 0.3776123523712158, 0.48166632652282715, 0.5857203006744385, 0.6897742748260498, 0.7938283085823059, 0.8978822827339172, 1.0019361972808838, 1.1059902906417847, 1.210044264793396, 1.3140982389450073, 1.4181522130966187, 1.52220618724823, 1.6262602806091309, 1.7303142547607422, 1.8343682289123535, 1.9384222030639648, 2.042476177215576, 2.1465301513671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 14.0, 7.0, 15.0, 15.0, 22.0, 22.0, 23.0, 27.0, 35.0, 27.0, 33.0, 37.0, 38.0, 45.0, 45.0, 46.0, 47.0, 37.0, 34.0, 33.0, 40.0, 36.0, 34.0, 29.0, 27.0, 25.0, 29.0, 26.0, 26.0, 21.0, 11.0, 13.0, 7.0, 12.0, 11.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2501275539398193, -2.178273916244507, -2.1064205169677734, -2.034566879272461, -1.962713360786438, -1.890859842300415, -1.8190062046051025, -1.7471526861190796, -1.6752991676330566, -1.6034456491470337, -1.5315921306610107, -1.4597384929656982, -1.3878849744796753, -1.3160314559936523, -1.2441778182983398, -1.172324299812317, -1.100470781326294, -1.028617262840271, -0.9567636847496033, -0.8849101066589355, -0.8130565881729126, -0.7412030696868896, -0.6693494915962219, -0.5974959135055542, -0.5256423950195312, -0.4537888467311859, -0.3819352984428406, -0.31008175015449524, -0.2382282018661499, -0.16637465357780457, -0.09452110528945923, -0.022667527198791504, 0.04918622970581055, 0.12103977799415588, 0.19289332628250122, 0.26474687457084656, 0.3366004228591919, 0.40845397114753723, 0.48030751943588257, 0.5521610975265503, 0.6240146160125732, 0.6958681344985962, 0.7677217125892639, 0.8395752906799316, 0.9114288091659546, 0.9832823276519775, 1.05513596534729, 1.126989483833313, 1.198843002319336, 1.2706965208053589, 1.3425500392913818, 1.4144036769866943, 1.4862571954727173, 1.5581107139587402, 1.6299643516540527, 1.7018178701400757, 1.7736713886260986, 1.8455249071121216, 1.9173784255981445, 1.989232063293457, 2.0610857009887695, 2.132939100265503, 2.2047927379608154, 2.276646137237549, 2.3484997749328613]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 10.0, 6.0, 4.0, 15.0, 21.0, 25.0, 42.0, 74.0, 145.0, 182.0, 334.0, 586.0, 1251.0, 3765.0, 20566.0, 261265.0, 704924.0, 45386.0, 6399.0, 1768.0, 765.0, 379.0, 227.0, 135.0, 90.0, 65.0, 44.0, 26.0, 14.0, 16.0, 10.0, 9.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.689453125, -1.64520263671875, -1.6009521484375, -1.55670166015625, -1.512451171875, -1.46820068359375, -1.4239501953125, -1.37969970703125, -1.33544921875, -1.29119873046875, -1.2469482421875, -1.20269775390625, -1.158447265625, -1.11419677734375, -1.0699462890625, -1.02569580078125, -0.9814453125, -0.93719482421875, -0.8929443359375, -0.84869384765625, -0.804443359375, -0.76019287109375, -0.7159423828125, -0.67169189453125, -0.62744140625, -0.58319091796875, -0.5389404296875, -0.49468994140625, -0.450439453125, -0.40618896484375, -0.3619384765625, -0.31768798828125, -0.2734375, -0.22918701171875, -0.1849365234375, -0.14068603515625, -0.096435546875, -0.05218505859375, -0.0079345703125, 0.03631591796875, 0.08056640625, 0.12481689453125, 0.1690673828125, 0.21331787109375, 0.257568359375, 0.30181884765625, 0.3460693359375, 0.39031982421875, 0.4345703125, 0.47882080078125, 0.5230712890625, 0.56732177734375, 0.611572265625, 0.65582275390625, 0.7000732421875, 0.74432373046875, 0.78857421875, 0.83282470703125, 0.8770751953125, 0.92132568359375, 0.965576171875, 1.00982666015625, 1.0540771484375, 1.09832763671875, 1.142578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 10.0, 8.0, 13.0, 14.0, 23.0, 27.0, 38.0, 33.0, 51.0, 66.0, 68.0, 72.0, 77.0, 72.0, 70.0, 66.0, 62.0, 39.0, 50.0, 45.0, 38.0, 18.0, 23.0, 7.0, 8.0, 1.0, 4.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.8283538818359375, -1.749481201171875, -1.6706085205078125, -1.59173583984375, -1.5128631591796875, -1.433990478515625, -1.3551177978515625, -1.2762451171875, -1.1973724365234375, -1.118499755859375, -1.0396270751953125, -0.96075439453125, -0.8818817138671875, -0.803009033203125, -0.7241363525390625, -0.645263671875, -0.5663909912109375, -0.487518310546875, -0.4086456298828125, -0.32977294921875, -0.2509002685546875, -0.172027587890625, -0.0931549072265625, -0.0142822265625, 0.0645904541015625, 0.143463134765625, 0.2223358154296875, 0.30120849609375, 0.3800811767578125, 0.458953857421875, 0.5378265380859375, 0.61669921875, 0.6955718994140625, 0.774444580078125, 0.8533172607421875, 0.93218994140625, 1.0110626220703125, 1.089935302734375, 1.1688079833984375, 1.2476806640625, 1.3265533447265625, 1.405426025390625, 1.4842987060546875, 1.56317138671875, 1.6420440673828125, 1.720916748046875, 1.7997894287109375, 1.878662109375, 1.9575347900390625, 2.036407470703125, 2.1152801513671875, 2.19415283203125, 2.2730255126953125, 2.351898193359375, 2.4307708740234375, 2.5096435546875, 2.5885162353515625, 2.667388916015625, 2.7462615966796875, 2.82513427734375, 2.9040069580078125, 2.982879638671875, 3.0617523193359375, 3.140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 5.0, 8.0, 20.0, 19.0, 36.0, 49.0, 55.0, 86.0, 171.0, 232.0, 354.0, 604.0, 1014.0, 1721.0, 3203.0, 5859.0, 11259.0, 23462.0, 51125.0, 137095.0, 416273.0, 248178.0, 80833.0, 33524.0, 15912.0, 7943.0, 4112.0, 2207.0, 1248.0, 720.0, 439.0, 247.0, 150.0, 110.0, 91.0, 43.0, 40.0, 28.0, 17.0, 13.0, 4.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.403564453125, -0.3904380798339844, -0.37731170654296875, -0.3641853332519531, -0.3510589599609375, -0.3379325866699219, -0.32480621337890625, -0.3116798400878906, -0.298553466796875, -0.2854270935058594, -0.27230072021484375, -0.2591743469238281, -0.2460479736328125, -0.23292160034179688, -0.21979522705078125, -0.20666885375976562, -0.19354248046875, -0.18041610717773438, -0.16728973388671875, -0.15416336059570312, -0.1410369873046875, -0.12791061401367188, -0.11478424072265625, -0.10165786743164062, -0.088531494140625, -0.07540512084960938, -0.06227874755859375, -0.049152374267578125, -0.0360260009765625, -0.022899627685546875, -0.00977325439453125, 0.003353118896484375, 0.0164794921875, 0.029605865478515625, 0.04273223876953125, 0.055858612060546875, 0.0689849853515625, 0.08211135864257812, 0.09523773193359375, 0.10836410522460938, 0.121490478515625, 0.13461685180664062, 0.14774322509765625, 0.16086959838867188, 0.1739959716796875, 0.18712234497070312, 0.20024871826171875, 0.21337509155273438, 0.22650146484375, 0.23962783813476562, 0.25275421142578125, 0.2658805847167969, 0.2790069580078125, 0.2921333312988281, 0.30525970458984375, 0.3183860778808594, 0.331512451171875, 0.3446388244628906, 0.35776519775390625, 0.3708915710449219, 0.3840179443359375, 0.3971443176269531, 0.41027069091796875, 0.4233970642089844, 0.4365234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 6.0, 11.0, 5.0, 12.0, 18.0, 16.0, 13.0, 36.0, 26.0, 39.0, 35.0, 41.0, 36.0, 38.0, 54.0, 47.0, 39.0, 51.0, 42.0, 34.0, 33.0, 50.0, 34.0, 39.0, 34.0, 32.0, 21.0, 22.0, 14.0, 21.0, 16.0, 11.0, 16.0, 9.0, 3.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.6392822265625, -4.489501953125, -4.3397216796875, -4.18994140625, -4.0401611328125, -3.890380859375, -3.7406005859375, -3.5908203125, -3.4410400390625, -3.291259765625, -3.1414794921875, -2.99169921875, -2.8419189453125, -2.692138671875, -2.5423583984375, -2.392578125, -2.2427978515625, -2.093017578125, -1.9432373046875, -1.79345703125, -1.6436767578125, -1.493896484375, -1.3441162109375, -1.1943359375, -1.0445556640625, -0.894775390625, -0.7449951171875, -0.59521484375, -0.4454345703125, -0.295654296875, -0.1458740234375, 0.00390625, 0.1536865234375, 0.303466796875, 0.4532470703125, 0.60302734375, 0.7528076171875, 0.902587890625, 1.0523681640625, 1.2021484375, 1.3519287109375, 1.501708984375, 1.6514892578125, 1.80126953125, 1.9510498046875, 2.100830078125, 2.2506103515625, 2.400390625, 2.5501708984375, 2.699951171875, 2.8497314453125, 2.99951171875, 3.1492919921875, 3.299072265625, 3.4488525390625, 3.5986328125, 3.7484130859375, 3.898193359375, 4.0479736328125, 4.19775390625, 4.3475341796875, 4.497314453125, 4.6470947265625, 4.796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 8.0, 8.0, 15.0, 15.0, 24.0, 46.0, 73.0, 141.0, 247.0, 474.0, 913.0, 2316.0, 7169.0, 41874.0, 665016.0, 296027.0, 25572.0, 5298.0, 1682.0, 735.0, 350.0, 203.0, 122.0, 71.0, 47.0, 27.0, 26.0, 16.0, 14.0, 8.0, 8.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.16518020629882812, -0.15982818603515625, -0.15447616577148438, -0.1491241455078125, -0.14377212524414062, -0.13842010498046875, -0.13306808471679688, -0.127716064453125, -0.12236404418945312, -0.11701202392578125, -0.11166000366210938, -0.1063079833984375, -0.10095596313476562, -0.09560394287109375, -0.09025192260742188, -0.08489990234375, -0.07954788208007812, -0.07419586181640625, -0.06884384155273438, -0.0634918212890625, -0.058139801025390625, -0.05278778076171875, -0.047435760498046875, -0.042083740234375, -0.036731719970703125, -0.03137969970703125, -0.026027679443359375, -0.0206756591796875, -0.015323638916015625, -0.00997161865234375, -0.004619598388671875, 0.000732421875, 0.006084442138671875, 0.01143646240234375, 0.016788482666015625, 0.0221405029296875, 0.027492523193359375, 0.03284454345703125, 0.038196563720703125, 0.043548583984375, 0.048900604248046875, 0.05425262451171875, 0.059604644775390625, 0.0649566650390625, 0.07030868530273438, 0.07566070556640625, 0.08101272583007812, 0.08636474609375, 0.09171676635742188, 0.09706878662109375, 0.10242080688476562, 0.1077728271484375, 0.11312484741210938, 0.11847686767578125, 0.12382888793945312, 0.129180908203125, 0.13453292846679688, 0.13988494873046875, 0.14523696899414062, 0.1505889892578125, 0.15594100952148438, 0.16129302978515625, 0.16664505004882812, 0.1719970703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 3.0, 5.0, 10.0, 16.0, 17.0, 50.0, 68.0, 101.0, 148.0, 178.0, 151.0, 95.0, 59.0, 35.0, 20.0, 17.0, 8.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001157522201538086, -0.00011194311082363129, -0.00010813400149345398, -0.00010432489216327667, -0.00010051578283309937, -9.670667350292206e-05, -9.289756417274475e-05, -8.908845484256744e-05, -8.527934551239014e-05, -8.147023618221283e-05, -7.766112685203552e-05, -7.385201752185822e-05, -7.004290819168091e-05, -6.62337988615036e-05, -6.24246895313263e-05, -5.861558020114899e-05, -5.480647087097168e-05, -5.099736154079437e-05, -4.7188252210617065e-05, -4.337914288043976e-05, -3.957003355026245e-05, -3.5760924220085144e-05, -3.195181488990784e-05, -2.814270555973053e-05, -2.4333596229553223e-05, -2.0524486899375916e-05, -1.671537756919861e-05, -1.2906268239021301e-05, -9.097158908843994e-06, -5.288049578666687e-06, -1.4789402484893799e-06, 2.3301690816879272e-06, 6.139278411865234e-06, 9.948387742042542e-06, 1.3757497072219849e-05, 1.7566606402397156e-05, 2.1375715732574463e-05, 2.518482506275177e-05, 2.8993934392929077e-05, 3.2803043723106384e-05, 3.661215305328369e-05, 4.0421262383461e-05, 4.4230371713638306e-05, 4.803948104381561e-05, 5.184859037399292e-05, 5.565769970417023e-05, 5.9466809034347534e-05, 6.327591836452484e-05, 6.708502769470215e-05, 7.089413702487946e-05, 7.470324635505676e-05, 7.851235568523407e-05, 8.232146501541138e-05, 8.613057434558868e-05, 8.993968367576599e-05, 9.37487930059433e-05, 9.75579023361206e-05, 0.00010136701166629791, 0.00010517612099647522, 0.00010898523032665253, 0.00011279433965682983, 0.00011660344898700714, 0.00012041255831718445, 0.00012422166764736176, 0.00012803077697753906]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 7.0, 1.0, 5.0, 4.0, 4.0, 4.0, 6.0, 13.0, 25.0, 26.0, 34.0, 43.0, 55.0, 65.0, 130.0, 170.0, 310.0, 465.0, 861.0, 1530.0, 2996.0, 6780.0, 16631.0, 51416.0, 255675.0, 580087.0, 89073.0, 24771.0, 9072.0, 3961.0, 1874.0, 959.0, 511.0, 325.0, 192.0, 132.0, 95.0, 66.0, 59.0, 28.0, 24.0, 21.0, 12.0, 10.0, 9.0, 7.0, 9.0, 2.0, 6.0, 0.0, 0.0, 2.0, 4.0], "bins": [-0.138427734375, -0.13460445404052734, -0.1307811737060547, -0.12695789337158203, -0.12313461303710938, -0.11931133270263672, -0.11548805236816406, -0.1116647720336914, -0.10784149169921875, -0.1040182113647461, -0.10019493103027344, -0.09637165069580078, -0.09254837036132812, -0.08872509002685547, -0.08490180969238281, -0.08107852935791016, -0.0772552490234375, -0.07343196868896484, -0.06960868835449219, -0.06578540802001953, -0.061962127685546875, -0.05813884735107422, -0.05431556701660156, -0.050492286682128906, -0.04666900634765625, -0.042845726013183594, -0.03902244567871094, -0.03519916534423828, -0.031375885009765625, -0.02755260467529297, -0.023729324340820312, -0.019906044006347656, -0.016082763671875, -0.012259483337402344, -0.008436203002929688, -0.004612922668457031, -0.000789642333984375, 0.0030336380004882812, 0.0068569183349609375, 0.010680198669433594, 0.01450347900390625, 0.018326759338378906, 0.022150039672851562, 0.02597332000732422, 0.029796600341796875, 0.03361988067626953, 0.03744316101074219, 0.041266441345214844, 0.0450897216796875, 0.048913002014160156, 0.05273628234863281, 0.05655956268310547, 0.060382843017578125, 0.06420612335205078, 0.06802940368652344, 0.0718526840209961, 0.07567596435546875, 0.0794992446899414, 0.08332252502441406, 0.08714580535888672, 0.09096908569335938, 0.09479236602783203, 0.09861564636230469, 0.10243892669677734, 0.10626220703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 4.0, 11.0, 13.0, 15.0, 19.0, 39.0, 53.0, 89.0, 170.0, 262.0, 136.0, 67.0, 45.0, 28.0, 12.0, 13.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050323486328125, -0.04866218566894531, -0.047000885009765625, -0.04533958435058594, -0.04367828369140625, -0.04201698303222656, -0.040355682373046875, -0.03869438171386719, -0.0370330810546875, -0.03537178039550781, -0.033710479736328125, -0.03204917907714844, -0.03038787841796875, -0.028726577758789062, -0.027065277099609375, -0.025403976440429688, -0.02374267578125, -0.022081375122070312, -0.020420074462890625, -0.018758773803710938, -0.01709747314453125, -0.015436172485351562, -0.013774871826171875, -0.012113571166992188, -0.0104522705078125, -0.008790969848632812, -0.007129669189453125, -0.0054683685302734375, -0.00380706787109375, -0.0021457672119140625, -0.000484466552734375, 0.0011768341064453125, 0.002838134765625, 0.0044994354248046875, 0.006160736083984375, 0.007822036743164062, 0.00948333740234375, 0.011144638061523438, 0.012805938720703125, 0.014467239379882812, 0.0161285400390625, 0.017789840698242188, 0.019451141357421875, 0.021112442016601562, 0.02277374267578125, 0.024435043334960938, 0.026096343994140625, 0.027757644653320312, 0.0294189453125, 0.031080245971679688, 0.032741546630859375, 0.03440284729003906, 0.03606414794921875, 0.03772544860839844, 0.039386749267578125, 0.04104804992675781, 0.0427093505859375, 0.04437065124511719, 0.046031951904296875, 0.04769325256347656, 0.04935455322265625, 0.05101585388183594, 0.052677154541015625, 0.05433845520019531, 0.055999755859375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 18.0, 48.0, 81.0, 170.0, 196.0, 225.0, 126.0, 80.0, 42.0, 14.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6458585262298584, -3.462466239929199, -3.279074192047119, -3.095682144165039, -2.91228985786438, -2.7288975715637207, -2.5455055236816406, -2.3621134757995605, -2.1787211894989014, -1.9953290224075317, -1.811936855316162, -1.6285446882247925, -1.4451525211334229, -1.2617603540420532, -1.0783681869506836, -0.894976019859314, -0.7115838527679443, -0.5281916856765747, -0.3447995185852051, -0.16140735149383545, 0.02198481559753418, 0.2053769826889038, 0.38876914978027344, 0.5721613168716431, 0.7555534839630127, 0.9389456510543823, 1.122337818145752, 1.3057299852371216, 1.4891221523284912, 1.6725143194198608, 1.8559064865112305, 2.0392985343933105, 2.2226905822753906, 2.4060826301574707, 2.58947491645813, 2.772867202758789, 2.956259250640869, 3.139651298522949, 3.3230435848236084, 3.5064358711242676, 3.6898279190063477, 3.8732199668884277, 4.056612014770508, 4.240004539489746, 4.423396587371826, 4.606788635253906, 4.7901811599731445, 4.973573207855225, 5.156965255737305, 5.340357303619385, 5.523749351501465, 5.707141876220703, 5.890533924102783, 6.073925971984863, 6.257318496704102, 6.440710544586182, 6.624102592468262, 6.807494640350342, 6.990886688232422, 7.17427921295166, 7.35767126083374, 7.54106330871582, 7.724455833435059, 7.907847881317139, 8.091239929199219]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 8.0, 18.0, 13.0, 21.0, 22.0, 34.0, 44.0, 53.0, 44.0, 66.0, 66.0, 67.0, 80.0, 62.0, 57.0, 61.0, 50.0, 44.0, 41.0, 47.0, 31.0, 23.0, 13.0, 9.0, 12.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7804067134857178, -1.7105568647384644, -1.640707015991211, -1.570857286453247, -1.5010074377059937, -1.4311575889587402, -1.3613078594207764, -1.291458010673523, -1.2216081619262695, -1.1517583131790161, -1.0819084644317627, -1.0120587348937988, -0.9422088861465454, -0.872359037399292, -0.8025092482566833, -0.7326594591140747, -0.6628096103668213, -0.5929597616195679, -0.5231099724769592, -0.4532601535320282, -0.38341033458709717, -0.31356051564216614, -0.2437106966972351, -0.17386087775230408, -0.10401105880737305, -0.03416123986244202, 0.035688579082489014, 0.10553839802742004, 0.17538821697235107, 0.2452380359172821, 0.31508785486221313, 0.38493767380714417, 0.4547877311706543, 0.5246375799179077, 0.5944873690605164, 0.664337158203125, 0.7341870069503784, 0.8040368556976318, 0.8738866448402405, 0.9437364339828491, 1.0135862827301025, 1.083436131477356, 1.1532859802246094, 1.2231357097625732, 1.2929855585098267, 1.36283540725708, 1.432685136795044, 1.5025349855422974, 1.5723848342895508, 1.6422346830368042, 1.7120845317840576, 1.7819342613220215, 1.851784110069275, 1.9216339588165283, 1.9914836883544922, 2.061333656311035, 2.131183385848999, 2.201033115386963, 2.270883083343506, 2.3407328128814697, 2.4105825424194336, 2.4804325103759766, 2.5502822399139404, 2.6201322078704834, 2.6899819374084473]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 5.0, 3.0, 5.0, 11.0, 13.0, 18.0, 29.0, 45.0, 45.0, 80.0, 130.0, 237.0, 394.0, 943.0, 2993.0, 21244.0, 261115.0, 677169.0, 73875.0, 7283.0, 1544.0, 585.0, 302.0, 175.0, 118.0, 47.0, 47.0, 34.0, 18.0, 11.0, 12.0, 8.0, 7.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.2379150390625, -6.038330078125, -5.8387451171875, -5.63916015625, -5.4395751953125, -5.239990234375, -5.0404052734375, -4.8408203125, -4.6412353515625, -4.441650390625, -4.2420654296875, -4.04248046875, -3.8428955078125, -3.643310546875, -3.4437255859375, -3.244140625, -3.0445556640625, -2.844970703125, -2.6453857421875, -2.44580078125, -2.2462158203125, -2.046630859375, -1.8470458984375, -1.6474609375, -1.4478759765625, -1.248291015625, -1.0487060546875, -0.84912109375, -0.6495361328125, -0.449951171875, -0.2503662109375, -0.05078125, 0.1488037109375, 0.348388671875, 0.5479736328125, 0.74755859375, 0.9471435546875, 1.146728515625, 1.3463134765625, 1.5458984375, 1.7454833984375, 1.945068359375, 2.1446533203125, 2.34423828125, 2.5438232421875, 2.743408203125, 2.9429931640625, 3.142578125, 3.3421630859375, 3.541748046875, 3.7413330078125, 3.94091796875, 4.1405029296875, 4.340087890625, 4.5396728515625, 4.7392578125, 4.9388427734375, 5.138427734375, 5.3380126953125, 5.53759765625, 5.7371826171875, 5.936767578125, 6.1363525390625, 6.3359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 12.0, 21.0, 24.0, 31.0, 38.0, 43.0, 64.0, 57.0, 69.0, 84.0, 81.0, 89.0, 69.0, 65.0, 53.0, 39.0, 45.0, 33.0, 25.0, 21.0, 10.0, 6.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.93365478515625, -3.8009033203125, -3.66815185546875, -3.535400390625, -3.40264892578125, -3.2698974609375, -3.13714599609375, -3.00439453125, -2.87164306640625, -2.7388916015625, -2.60614013671875, -2.473388671875, -2.34063720703125, -2.2078857421875, -2.07513427734375, -1.9423828125, -1.80963134765625, -1.6768798828125, -1.54412841796875, -1.411376953125, -1.27862548828125, -1.1458740234375, -1.01312255859375, -0.88037109375, -0.74761962890625, -0.6148681640625, -0.48211669921875, -0.349365234375, -0.21661376953125, -0.0838623046875, 0.04888916015625, 0.181640625, 0.31439208984375, 0.4471435546875, 0.57989501953125, 0.712646484375, 0.84539794921875, 0.9781494140625, 1.11090087890625, 1.24365234375, 1.37640380859375, 1.5091552734375, 1.64190673828125, 1.774658203125, 1.90740966796875, 2.0401611328125, 2.17291259765625, 2.3056640625, 2.43841552734375, 2.5711669921875, 2.70391845703125, 2.836669921875, 2.96942138671875, 3.1021728515625, 3.23492431640625, 3.36767578125, 3.50042724609375, 3.6331787109375, 3.76593017578125, 3.898681640625, 4.03143310546875, 4.1641845703125, 4.29693603515625, 4.4296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 8.0, 3.0, 8.0, 10.0, 7.0, 9.0, 18.0, 36.0, 51.0, 64.0, 137.0, 228.0, 378.0, 731.0, 1294.0, 2982.0, 8432.0, 38212.0, 287077.0, 587397.0, 96748.0, 15951.0, 4686.0, 1926.0, 938.0, 500.0, 268.0, 156.0, 109.0, 70.0, 45.0, 27.0, 16.0, 7.0, 3.0, 3.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5078125, -5.34210205078125, -5.1763916015625, -5.01068115234375, -4.844970703125, -4.67926025390625, -4.5135498046875, -4.34783935546875, -4.18212890625, -4.01641845703125, -3.8507080078125, -3.68499755859375, -3.519287109375, -3.35357666015625, -3.1878662109375, -3.02215576171875, -2.8564453125, -2.69073486328125, -2.5250244140625, -2.35931396484375, -2.193603515625, -2.02789306640625, -1.8621826171875, -1.69647216796875, -1.53076171875, -1.36505126953125, -1.1993408203125, -1.03363037109375, -0.867919921875, -0.70220947265625, -0.5364990234375, -0.37078857421875, -0.205078125, -0.03936767578125, 0.1263427734375, 0.29205322265625, 0.457763671875, 0.62347412109375, 0.7891845703125, 0.95489501953125, 1.12060546875, 1.28631591796875, 1.4520263671875, 1.61773681640625, 1.783447265625, 1.94915771484375, 2.1148681640625, 2.28057861328125, 2.4462890625, 2.61199951171875, 2.7777099609375, 2.94342041015625, 3.109130859375, 3.27484130859375, 3.4405517578125, 3.60626220703125, 3.77197265625, 3.93768310546875, 4.1033935546875, 4.26910400390625, 4.434814453125, 4.60052490234375, 4.7662353515625, 4.93194580078125, 5.09765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 9.0, 14.0, 21.0, 22.0, 34.0, 42.0, 47.0, 52.0, 63.0, 73.0, 72.0, 63.0, 78.0, 84.0, 54.0, 53.0, 48.0, 31.0, 30.0, 18.0, 19.0, 14.0, 23.0, 5.0, 1.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3203125, -4.16845703125, -4.0166015625, -3.86474609375, -3.712890625, -3.56103515625, -3.4091796875, -3.25732421875, -3.10546875, -2.95361328125, -2.8017578125, -2.64990234375, -2.498046875, -2.34619140625, -2.1943359375, -2.04248046875, -1.890625, -1.73876953125, -1.5869140625, -1.43505859375, -1.283203125, -1.13134765625, -0.9794921875, -0.82763671875, -0.67578125, -0.52392578125, -0.3720703125, -0.22021484375, -0.068359375, 0.08349609375, 0.2353515625, 0.38720703125, 0.5390625, 0.69091796875, 0.8427734375, 0.99462890625, 1.146484375, 1.29833984375, 1.4501953125, 1.60205078125, 1.75390625, 1.90576171875, 2.0576171875, 2.20947265625, 2.361328125, 2.51318359375, 2.6650390625, 2.81689453125, 2.96875, 3.12060546875, 3.2724609375, 3.42431640625, 3.576171875, 3.72802734375, 3.8798828125, 4.03173828125, 4.18359375, 4.33544921875, 4.4873046875, 4.63916015625, 4.791015625, 4.94287109375, 5.0947265625, 5.24658203125, 5.3984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 12.0, 30.0, 28.0, 36.0, 66.0, 92.0, 145.0, 221.0, 315.0, 531.0, 977.0, 1892.0, 3830.0, 8817.0, 21940.0, 62805.0, 199575.0, 471117.0, 181939.0, 57754.0, 20444.0, 8197.0, 3597.0, 1763.0, 970.0, 511.0, 323.0, 201.0, 137.0, 93.0, 57.0, 40.0, 23.0, 11.0, 25.0, 9.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.73779296875, -0.7150650024414062, -0.6923370361328125, -0.6696090698242188, -0.646881103515625, -0.6241531372070312, -0.6014251708984375, -0.5786972045898438, -0.55596923828125, -0.5332412719726562, -0.5105133056640625, -0.48778533935546875, -0.465057373046875, -0.44232940673828125, -0.4196014404296875, -0.39687347412109375, -0.3741455078125, -0.35141754150390625, -0.3286895751953125, -0.30596160888671875, -0.283233642578125, -0.26050567626953125, -0.2377777099609375, -0.21504974365234375, -0.19232177734375, -0.16959381103515625, -0.1468658447265625, -0.12413787841796875, -0.101409912109375, -0.07868194580078125, -0.0559539794921875, -0.03322601318359375, -0.010498046875, 0.01222991943359375, 0.0349578857421875, 0.05768585205078125, 0.080413818359375, 0.10314178466796875, 0.1258697509765625, 0.14859771728515625, 0.17132568359375, 0.19405364990234375, 0.2167816162109375, 0.23950958251953125, 0.262237548828125, 0.28496551513671875, 0.3076934814453125, 0.33042144775390625, 0.3531494140625, 0.37587738037109375, 0.3986053466796875, 0.42133331298828125, 0.444061279296875, 0.46678924560546875, 0.4895172119140625, 0.5122451782226562, 0.53497314453125, 0.5577011108398438, 0.5804290771484375, 0.6031570434570312, 0.625885009765625, 0.6486129760742188, 0.6713409423828125, 0.6940689086914062, 0.716796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 7.0, 19.0, 29.0, 27.0, 32.0, 39.0, 48.0, 68.0, 65.0, 94.0, 131.0, 58.0, 56.0, 59.0, 49.0, 41.0, 33.0, 26.0, 22.0, 17.0, 13.0, 4.0, 7.0, 4.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001786947250366211, -0.00017332099378108978, -0.00016794726252555847, -0.00016257353127002716, -0.00015719980001449585, -0.00015182606875896454, -0.00014645233750343323, -0.00014107860624790192, -0.0001357048749923706, -0.0001303311437368393, -0.00012495741248130798, -0.00011958368122577667, -0.00011420994997024536, -0.00010883621871471405, -0.00010346248745918274, -9.808875620365143e-05, -9.271502494812012e-05, -8.73412936925888e-05, -8.19675624370575e-05, -7.659383118152618e-05, -7.122009992599487e-05, -6.584636867046356e-05, -6.047263741493225e-05, -5.509890615940094e-05, -4.972517490386963e-05, -4.435144364833832e-05, -3.897771239280701e-05, -3.3603981137275696e-05, -2.8230249881744385e-05, -2.2856518626213074e-05, -1.7482787370681763e-05, -1.2109056115150452e-05, -6.735324859619141e-06, -1.3615936040878296e-06, 4.0121376514434814e-06, 9.385868906974792e-06, 1.4759600162506104e-05, 2.0133331418037415e-05, 2.5507062673568726e-05, 3.088079392910004e-05, 3.625452518463135e-05, 4.162825644016266e-05, 4.700198769569397e-05, 5.237571895122528e-05, 5.774945020675659e-05, 6.31231814622879e-05, 6.849691271781921e-05, 7.387064397335052e-05, 7.924437522888184e-05, 8.461810648441315e-05, 8.999183773994446e-05, 9.536556899547577e-05, 0.00010073930025100708, 0.00010611303150653839, 0.0001114867627620697, 0.00011686049401760101, 0.00012223422527313232, 0.00012760795652866364, 0.00013298168778419495, 0.00013835541903972626, 0.00014372915029525757, 0.00014910288155078888, 0.0001544766128063202, 0.0001598503440618515, 0.0001652240753173828]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 0.0, 6.0, 9.0, 9.0, 10.0, 17.0, 16.0, 34.0, 44.0, 57.0, 85.0, 149.0, 240.0, 361.0, 721.0, 1439.0, 3371.0, 8396.0, 29076.0, 173505.0, 671393.0, 123960.0, 22966.0, 6926.0, 2826.0, 1289.0, 659.0, 386.0, 211.0, 107.0, 69.0, 59.0, 31.0, 29.0, 26.0, 17.0, 17.0, 4.0, 6.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.8212890625, -1.76837158203125, -1.7154541015625, -1.66253662109375, -1.609619140625, -1.55670166015625, -1.5037841796875, -1.45086669921875, -1.39794921875, -1.34503173828125, -1.2921142578125, -1.23919677734375, -1.186279296875, -1.13336181640625, -1.0804443359375, -1.02752685546875, -0.974609375, -0.92169189453125, -0.8687744140625, -0.81585693359375, -0.762939453125, -0.71002197265625, -0.6571044921875, -0.60418701171875, -0.55126953125, -0.49835205078125, -0.4454345703125, -0.39251708984375, -0.339599609375, -0.28668212890625, -0.2337646484375, -0.18084716796875, -0.1279296875, -0.07501220703125, -0.0220947265625, 0.03082275390625, 0.083740234375, 0.13665771484375, 0.1895751953125, 0.24249267578125, 0.29541015625, 0.34832763671875, 0.4012451171875, 0.45416259765625, 0.507080078125, 0.55999755859375, 0.6129150390625, 0.66583251953125, 0.71875, 0.77166748046875, 0.8245849609375, 0.87750244140625, 0.930419921875, 0.98333740234375, 1.0362548828125, 1.08917236328125, 1.14208984375, 1.19500732421875, 1.2479248046875, 1.30084228515625, 1.353759765625, 1.40667724609375, 1.4595947265625, 1.51251220703125, 1.5654296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 11.0, 19.0, 43.0, 61.0, 96.0, 149.0, 241.0, 131.0, 77.0, 54.0, 36.0, 27.0, 17.0, 7.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.01617431640625, -0.9825439453125, -0.94891357421875, -0.915283203125, -0.88165283203125, -0.8480224609375, -0.81439208984375, -0.78076171875, -0.74713134765625, -0.7135009765625, -0.67987060546875, -0.646240234375, -0.61260986328125, -0.5789794921875, -0.54534912109375, -0.51171875, -0.47808837890625, -0.4444580078125, -0.41082763671875, -0.377197265625, -0.34356689453125, -0.3099365234375, -0.27630615234375, -0.24267578125, -0.20904541015625, -0.1754150390625, -0.14178466796875, -0.108154296875, -0.07452392578125, -0.0408935546875, -0.00726318359375, 0.0263671875, 0.05999755859375, 0.0936279296875, 0.12725830078125, 0.160888671875, 0.19451904296875, 0.2281494140625, 0.26177978515625, 0.29541015625, 0.32904052734375, 0.3626708984375, 0.39630126953125, 0.429931640625, 0.46356201171875, 0.4971923828125, 0.53082275390625, 0.564453125, 0.59808349609375, 0.6317138671875, 0.66534423828125, 0.698974609375, 0.73260498046875, 0.7662353515625, 0.79986572265625, 0.83349609375, 0.86712646484375, 0.9007568359375, 0.93438720703125, 0.968017578125, 1.00164794921875, 1.0352783203125, 1.06890869140625, 1.1025390625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 16.0, 65.0, 121.0, 217.0, 253.0, 185.0, 95.0, 24.0, 9.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.671242713928223, -11.243896484375, -10.816550254821777, -10.389204025268555, -9.961856842041016, -9.53451156616211, -9.10716438293457, -8.679818153381348, -8.252471923828125, -7.825125694274902, -7.39777946472168, -6.970432758331299, -6.543086528778076, -6.1157402992248535, -5.688393592834473, -5.26104736328125, -4.833701133728027, -4.406354904174805, -3.979008436203003, -3.551661968231201, -3.1243157386779785, -2.696969509124756, -2.269623041152954, -1.8422765731811523, -1.4149303436279297, -0.9875839948654175, -0.5602376461029053, -0.13289129734039307, 0.29445505142211914, 0.7218012809753418, 1.1491477489471436, 1.5764942169189453, 2.003840446472168, 2.4311866760253906, 2.8585331439971924, 3.285879611968994, 3.713225841522217, 4.1405720710754395, 4.56791877746582, 4.995265007019043, 5.422611236572266, 5.849957466125488, 6.277303695678711, 6.704650402069092, 7.1319966316223145, 7.559342861175537, 7.986689567565918, 8.41403579711914, 8.841382026672363, 9.268728256225586, 9.696074485778809, 10.123420715332031, 10.55076789855957, 10.978113174438477, 11.405460357666016, 11.832806587219238, 12.260152816772461, 12.687499046325684, 13.114845275878906, 13.542191505432129, 13.969537734985352, 14.39688491821289, 14.824231147766113, 15.251577377319336, 15.678923606872559]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 7.0, 5.0, 10.0, 9.0, 16.0, 14.0, 20.0, 34.0, 35.0, 31.0, 38.0, 40.0, 53.0, 62.0, 48.0, 65.0, 69.0, 45.0, 45.0, 44.0, 61.0, 42.0, 39.0, 36.0, 33.0, 23.0, 23.0, 13.0, 9.0, 10.0, 11.0, 5.0, 8.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.266835689544678, -7.066995620727539, -6.8671555519104, -6.667315483093262, -6.467475414276123, -6.267635345458984, -6.067795276641846, -5.867955207824707, -5.668115139007568, -5.46827507019043, -5.268435001373291, -5.068594932556152, -4.868754863739014, -4.668914794921875, -4.469074726104736, -4.269234657287598, -4.069394588470459, -3.8695545196533203, -3.6697144508361816, -3.469874382019043, -3.2700343132019043, -3.0701942443847656, -2.870354175567627, -2.6705141067504883, -2.4706740379333496, -2.270833969116211, -2.0709939002990723, -1.8711538314819336, -1.671313762664795, -1.4714736938476562, -1.2716336250305176, -1.071793556213379, -0.8719534873962402, -0.6721134185791016, -0.4722733497619629, -0.2724332809448242, -0.07259321212768555, 0.12724685668945312, 0.3270869255065918, 0.5269269943237305, 0.7267670631408691, 0.9266071319580078, 1.1264472007751465, 1.3262872695922852, 1.5261273384094238, 1.7259674072265625, 1.9258074760437012, 2.12564754486084, 2.3254876136779785, 2.525327682495117, 2.725167751312256, 2.9250078201293945, 3.124847888946533, 3.324687957763672, 3.5245280265808105, 3.724368095397949, 3.924208164215088, 4.124048233032227, 4.323888301849365, 4.523728370666504, 4.723568439483643, 4.923408508300781, 5.12324857711792, 5.323088645935059, 5.522928714752197]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 17.0, 24.0, 39.0, 67.0, 106.0, 208.0, 335.0, 519.0, 891.0, 1488.0, 2251.0, 1035347.0, 3574.0, 2227.0, 1426.0, 885.0, 505.0, 261.0, 170.0, 98.0, 72.0, 36.0, 20.0, 23.0, 8.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.990660190582275, -6.710498332977295, -6.4303364753723145, -6.150174617767334, -5.8700127601623535, -5.589850902557373, -5.309688568115234, -5.029526710510254, -4.749364852905273, -4.469202995300293, -4.1890411376953125, -3.908879280090332, -3.6287174224853516, -3.348555564880371, -3.0683934688568115, -2.788231611251831, -2.5080699920654297, -2.227908134460449, -1.9477462768554688, -1.6675843000411987, -1.3874224424362183, -1.1072605848312378, -0.8270986080169678, -0.5469367504119873, -0.26677489280700684, 0.01338699460029602, 0.2935488820075989, 0.5737107992172241, 0.8538726568222046, 1.134034514427185, 1.414196491241455, 1.6943583488464355, 1.9745197296142578, 2.2546815872192383, 2.5348434448242188, 2.815005302429199, 3.0951671600341797, 3.37532901763916, 3.6554911136627197, 3.9356529712677, 4.215814590454102, 4.495976448059082, 4.7761383056640625, 5.056300163269043, 5.336462020874023, 5.616623878479004, 5.896785736083984, 6.176947593688965, 6.4571099281311035, 6.737271785736084, 7.0174336433410645, 7.297595500946045, 7.577757358551025, 7.857919216156006, 8.138081550598145, 8.418243408203125, 8.698405265808105, 8.978567123413086, 9.258728981018066, 9.538890838623047, 9.819052696228027, 10.099214553833008, 10.379376411437988, 10.659538269042969, 10.93970012664795]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 14.0, 17.0, 7.0, 1.0, 1.0, 5.0, 7.0, 10.0, 13.0, 19.0, 15.0, 29.0, 62.0, 113.0, 281.0, 820.0, 2406.0, 7085.0, 51425508.0, 22990.0, 7501.0, 2925.0, 934.0, 302.0, 120.0, 62.0, 29.0, 24.0, 11.0, 10.0, 12.0, 7.0, 10.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.328125, -19.542625427246094, -18.757125854492188, -17.97162628173828, -17.186128616333008, -16.4006290435791, -15.615129470825195, -14.829629898071289, -14.0441312789917, -13.258631706237793, -12.473133087158203, -11.687633514404297, -10.90213394165039, -10.1166353225708, -9.331135749816895, -8.545637130737305, -7.760137557983398, -6.97463846206665, -6.189139366149902, -5.403639793395996, -4.618140697479248, -3.8326416015625, -3.0471420288085938, -2.2616429328918457, -1.4761438369750977, -0.6906446218490601, 0.09485459327697754, 0.8803539276123047, 1.6658530235290527, 2.451352119445801, 3.236851692199707, 4.022350788116455, 4.807851791381836, 5.593350887298584, 6.378849983215332, 7.164349555969238, 7.949848651885986, 8.735347747802734, 9.52084732055664, 10.306346893310547, 11.091845512390137, 11.877345085144043, 12.662843704223633, 13.448343276977539, 14.233842849731445, 15.019341468811035, 15.804841041564941, 16.59033966064453, 17.375839233398438, 18.161338806152344, 18.94683837890625, 19.732337951660156, 20.51783561706543, 21.303335189819336, 22.088834762573242, 22.87433433532715, 23.659832000732422, 24.445331573486328, 25.230831146240234, 26.01633071899414, 26.801828384399414, 27.58732795715332, 28.372827529907227, 29.158327102661133, 29.94382667541504]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 7.0, 9.0, 9.0, 11.0, 17.0, 18.0, 33.0, 49.0, 80.0, 135.0, 209.0, 283.0, 414.0, 542.0, 934.0, 1403.0, 2139.0, 3434.0, 5295.0, 8392.0, 13384.0, 21307.0, 33725.0, 54571.0, 89186.0, 151806.0, 266134.0, 462778.0, 3799730.0, 566439.0, 331194.0, 188108.0, 110390.0, 67055.0, 41242.0, 26179.0, 16325.0, 10193.0, 6670.0, 4241.0, 2596.0, 1650.0, 1091.0, 684.0, 456.0, 292.0, 216.0, 137.0, 92.0, 51.0, 35.0, 26.0, 9.0, 13.0, 10.0, 5.0, 11.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.873046875, -0.8445968627929688, -0.8161468505859375, -0.7876968383789062, -0.759246826171875, -0.7307968139648438, -0.7023468017578125, -0.6738967895507812, -0.64544677734375, -0.6169967651367188, -0.5885467529296875, -0.5600967407226562, -0.531646728515625, -0.5031967163085938, -0.4747467041015625, -0.44629669189453125, -0.4178466796875, -0.38939666748046875, -0.3609466552734375, -0.33249664306640625, -0.304046630859375, -0.27559661865234375, -0.2471466064453125, -0.21869659423828125, -0.19024658203125, -0.16179656982421875, -0.1333465576171875, -0.10489654541015625, -0.076446533203125, -0.04799652099609375, -0.0195465087890625, 0.00890350341796875, 0.037353515625, 0.06580352783203125, 0.0942535400390625, 0.12270355224609375, 0.151153564453125, 0.17960357666015625, 0.2080535888671875, 0.23650360107421875, 0.26495361328125, 0.29340362548828125, 0.3218536376953125, 0.35030364990234375, 0.378753662109375, 0.40720367431640625, 0.4356536865234375, 0.46410369873046875, 0.4925537109375, 0.5210037231445312, 0.5494537353515625, 0.5779037475585938, 0.606353759765625, 0.6348037719726562, 0.6632537841796875, 0.6917037963867188, 0.72015380859375, 0.7486038208007812, 0.7770538330078125, 0.8055038452148438, 0.833953857421875, 0.8624038696289062, 0.8908538818359375, 0.9193038940429688, 0.94775390625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 9.0, 10.0, 10.0, 8.0, 8.0, 9.0, 21.0, 26.0, 28.0, 27.0, 39.0, 38.0, 32.0, 43.0, 50.0, 47.0, 41.0, 45.0, 1079.0, 49.0, 38.0, 50.0, 44.0, 51.0, 23.0, 29.0, 23.0, 24.0, 30.0, 11.0, 20.0, 16.0, 9.0, 8.0, 9.0, 3.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.984375, -18.362060546875, -17.73974609375, -17.117431640625, -16.4951171875, -15.872802734375, -15.25048828125, -14.628173828125, -14.005859375, -13.383544921875, -12.76123046875, -12.138916015625, -11.5166015625, -10.894287109375, -10.27197265625, -9.649658203125, -9.02734375, -8.405029296875, -7.78271484375, -7.160400390625, -6.5380859375, -5.915771484375, -5.29345703125, -4.671142578125, -4.048828125, -3.426513671875, -2.80419921875, -2.181884765625, -1.5595703125, -0.937255859375, -0.31494140625, 0.307373046875, 0.9296875, 1.552001953125, 2.17431640625, 2.796630859375, 3.4189453125, 4.041259765625, 4.66357421875, 5.285888671875, 5.908203125, 6.530517578125, 7.15283203125, 7.775146484375, 8.3974609375, 9.019775390625, 9.64208984375, 10.264404296875, 10.88671875, 11.509033203125, 12.13134765625, 12.753662109375, 13.3759765625, 13.998291015625, 14.62060546875, 15.242919921875, 15.865234375, 16.487548828125, 17.10986328125, 17.732177734375, 18.3544921875, 18.976806640625, 19.59912109375, 20.221435546875, 20.84375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 9.0, 14.0, 15.0, 32.0, 38.0, 59.0, 87.0, 111.0, 134.0, 242.0, 338.0, 477.0, 726.0, 1087.0, 1634.0, 2571.0, 3917.0, 6468.0, 10081.0, 16615.0, 26739.0, 44445.0, 76255.0, 135098.0, 247824.0, 452681.0, 3756748.0, 676364.0, 363431.0, 198416.0, 108816.0, 62821.0, 36818.0, 22407.0, 13659.0, 8539.0, 5480.0, 3474.0, 2308.0, 1426.0, 1026.0, 657.0, 404.0, 274.0, 209.0, 156.0, 102.0, 62.0, 46.0, 29.0, 18.0, 25.0, 14.0, 4.0, 2.0, 3.0, 4.0, 2.0], "bins": [-0.833984375, -0.8085708618164062, -0.7831573486328125, -0.7577438354492188, -0.732330322265625, -0.7069168090820312, -0.6815032958984375, -0.6560897827148438, -0.63067626953125, -0.6052627563476562, -0.5798492431640625, -0.5544357299804688, -0.529022216796875, -0.5036087036132812, -0.4781951904296875, -0.45278167724609375, -0.4273681640625, -0.40195465087890625, -0.3765411376953125, -0.35112762451171875, -0.325714111328125, -0.30030059814453125, -0.2748870849609375, -0.24947357177734375, -0.22406005859375, -0.19864654541015625, -0.1732330322265625, -0.14781951904296875, -0.122406005859375, -0.09699249267578125, -0.0715789794921875, -0.04616546630859375, -0.020751953125, 0.00466156005859375, 0.0300750732421875, 0.05548858642578125, 0.080902099609375, 0.10631561279296875, 0.1317291259765625, 0.15714263916015625, 0.18255615234375, 0.20796966552734375, 0.2333831787109375, 0.25879669189453125, 0.284210205078125, 0.30962371826171875, 0.3350372314453125, 0.36045074462890625, 0.3858642578125, 0.41127777099609375, 0.4366912841796875, 0.46210479736328125, 0.487518310546875, 0.5129318237304688, 0.5383453369140625, 0.5637588500976562, 0.58917236328125, 0.6145858764648438, 0.6399993896484375, 0.6654129028320312, 0.690826416015625, 0.7162399291992188, 0.7416534423828125, 0.7670669555664062, 0.79248046875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 9.0, 4.0, 8.0, 5.0, 12.0, 14.0, 14.0, 17.0, 20.0, 24.0, 17.0, 22.0, 24.0, 34.0, 42.0, 21.0, 40.0, 44.0, 39.0, 50.0, 337.0, 780.0, 32.0, 43.0, 41.0, 44.0, 37.0, 39.0, 22.0, 25.0, 29.0, 31.0, 12.0, 16.0, 13.0, 12.0, 11.0, 5.0, 11.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.2421875, -11.8603515625, -11.478515625, -11.0966796875, -10.71484375, -10.3330078125, -9.951171875, -9.5693359375, -9.1875, -8.8056640625, -8.423828125, -8.0419921875, -7.66015625, -7.2783203125, -6.896484375, -6.5146484375, -6.1328125, -5.7509765625, -5.369140625, -4.9873046875, -4.60546875, -4.2236328125, -3.841796875, -3.4599609375, -3.078125, -2.6962890625, -2.314453125, -1.9326171875, -1.55078125, -1.1689453125, -0.787109375, -0.4052734375, -0.0234375, 0.3583984375, 0.740234375, 1.1220703125, 1.50390625, 1.8857421875, 2.267578125, 2.6494140625, 3.03125, 3.4130859375, 3.794921875, 4.1767578125, 4.55859375, 4.9404296875, 5.322265625, 5.7041015625, 6.0859375, 6.4677734375, 6.849609375, 7.2314453125, 7.61328125, 7.9951171875, 8.376953125, 8.7587890625, 9.140625, 9.5224609375, 9.904296875, 10.2861328125, 10.66796875, 11.0498046875, 11.431640625, 11.8134765625, 12.1953125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 9.0, 6.0, 7.0, 17.0, 21.0, 38.0, 45.0, 67.0, 105.0, 153.0, 202.0, 283.0, 394.0, 618.0, 928.0, 1389.0, 2147.0, 3430.0, 5529.0, 8960.0, 15010.0, 25573.0, 45742.0, 85658.0, 176357.0, 401728.0, 3731261.0, 1093221.0, 353289.0, 157570.0, 78378.0, 42430.0, 24061.0, 14001.0, 8308.0, 5138.0, 3090.0, 2121.0, 1356.0, 896.0, 585.0, 412.0, 292.0, 183.0, 146.0, 85.0, 65.0, 40.0, 31.0, 19.0, 14.0, 8.0, 6.0, 6.0, 10.0, 5.0, 1.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0358428955078125, -1.002349853515625, -0.9688568115234375, -0.93536376953125, -0.9018707275390625, -0.868377685546875, -0.8348846435546875, -0.8013916015625, -0.7678985595703125, -0.734405517578125, -0.7009124755859375, -0.66741943359375, -0.6339263916015625, -0.600433349609375, -0.5669403076171875, -0.533447265625, -0.4999542236328125, -0.466461181640625, -0.4329681396484375, -0.39947509765625, -0.3659820556640625, -0.332489013671875, -0.2989959716796875, -0.2655029296875, -0.2320098876953125, -0.198516845703125, -0.1650238037109375, -0.13153076171875, -0.0980377197265625, -0.064544677734375, -0.0310516357421875, 0.00244140625, 0.0359344482421875, 0.069427490234375, 0.1029205322265625, 0.13641357421875, 0.1699066162109375, 0.203399658203125, 0.2368927001953125, 0.2703857421875, 0.3038787841796875, 0.337371826171875, 0.3708648681640625, 0.40435791015625, 0.4378509521484375, 0.471343994140625, 0.5048370361328125, 0.538330078125, 0.5718231201171875, 0.605316162109375, 0.6388092041015625, 0.67230224609375, 0.7057952880859375, 0.739288330078125, 0.7727813720703125, 0.8062744140625, 0.8397674560546875, 0.873260498046875, 0.9067535400390625, 0.94024658203125, 0.9737396240234375, 1.007232666015625, 1.0407257080078125, 1.07421875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 5.0, 8.0, 4.0, 5.0, 6.0, 11.0, 14.0, 15.0, 10.0, 22.0, 23.0, 24.0, 29.0, 32.0, 31.0, 33.0, 32.0, 50.0, 34.0, 35.0, 40.0, 841.0, 267.0, 44.0, 37.0, 33.0, 35.0, 32.0, 48.0, 28.0, 26.0, 26.0, 21.0, 18.0, 15.0, 19.0, 14.0, 11.0, 8.0, 9.0, 6.0, 10.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.6729736328125, -7.416259765625, -7.1595458984375, -6.90283203125, -6.6461181640625, -6.389404296875, -6.1326904296875, -5.8759765625, -5.6192626953125, -5.362548828125, -5.1058349609375, -4.84912109375, -4.5924072265625, -4.335693359375, -4.0789794921875, -3.822265625, -3.5655517578125, -3.308837890625, -3.0521240234375, -2.79541015625, -2.5386962890625, -2.281982421875, -2.0252685546875, -1.7685546875, -1.5118408203125, -1.255126953125, -0.9984130859375, -0.74169921875, -0.4849853515625, -0.228271484375, 0.0284423828125, 0.28515625, 0.5418701171875, 0.798583984375, 1.0552978515625, 1.31201171875, 1.5687255859375, 1.825439453125, 2.0821533203125, 2.3388671875, 2.5955810546875, 2.852294921875, 3.1090087890625, 3.36572265625, 3.6224365234375, 3.879150390625, 4.1358642578125, 4.392578125, 4.6492919921875, 4.906005859375, 5.1627197265625, 5.41943359375, 5.6761474609375, 5.932861328125, 6.1895751953125, 6.4462890625, 6.7030029296875, 6.959716796875, 7.2164306640625, 7.47314453125, 7.7298583984375, 7.986572265625, 8.2432861328125, 8.5]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 7.0, 23.0, 72.0, 298.0, 421.0, 129.0, 38.0, 12.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-29.07339859008789, -28.52666664123535, -27.979936599731445, -27.433204650878906, -26.886474609375, -26.33974266052246, -25.793010711669922, -25.246280670166016, -24.699548721313477, -24.152816772460938, -23.60608673095703, -23.059354782104492, -22.512624740600586, -21.965892791748047, -21.41916275024414, -20.8724308013916, -20.325698852539062, -19.778966903686523, -19.232236862182617, -18.685504913330078, -18.138774871826172, -17.592042922973633, -17.045310974121094, -16.498580932617188, -15.951850891113281, -15.405119895935059, -14.858388900756836, -14.311656951904297, -13.764925956726074, -13.218194961547852, -12.671463966369629, -12.124732971191406, -11.578001022338867, -11.031270027160645, -10.484539031982422, -9.937807083129883, -9.39107608795166, -8.844345092773438, -8.297614097595215, -7.750883102416992, -7.204151630401611, -6.657420635223389, -6.110689163208008, -5.563958168029785, -5.0172271728515625, -4.470495700836182, -3.923764705657959, -3.3770334720611572, -2.8303022384643555, -2.2835710048675537, -1.7368398904800415, -1.1901087760925293, -0.6433775424957275, -0.09664630889892578, 0.4500846862792969, 0.9968159198760986, 1.5435471534729004, 2.090278387069702, 2.637009620666504, 3.1837406158447266, 3.7304718494415283, 4.27720308303833, 4.823934078216553, 5.370665550231934, 5.917396545410156]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 7.0, 5.0, 3.0, 10.0, 9.0, 13.0, 21.0, 18.0, 22.0, 21.0, 25.0, 27.0, 39.0, 33.0, 37.0, 26.0, 42.0, 20.0, 33.0, 32.0, 39.0, 51.0, 34.0, 42.0, 55.0, 37.0, 45.0, 31.0, 22.0, 25.0, 17.0, 21.0, 19.0, 21.0, 15.0, 22.0, 13.0, 5.0, 11.0, 7.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.089702606201172, -11.727959632873535, -11.366217613220215, -11.004474639892578, -10.642732620239258, -10.280989646911621, -9.919246673583984, -9.557504653930664, -9.195762634277344, -8.834019660949707, -8.472277641296387, -8.11053466796875, -7.74879264831543, -7.387049674987793, -7.0253071784973145, -6.663564682006836, -6.301821708679199, -5.940079212188721, -5.578336715698242, -5.2165937423706055, -4.854851722717285, -4.493108749389648, -4.13136625289917, -3.7696237564086914, -3.407881259918213, -3.0461387634277344, -2.684396266937256, -2.3226535320281982, -1.9609110355377197, -1.5991685390472412, -1.2374258041381836, -0.8756833076477051, -0.513941764831543, -0.15219920873641968, 0.2095433473587036, 0.5712859630584717, 0.9330284595489502, 1.2947709560394287, 1.6565136909484863, 2.018256187438965, 2.3799986839294434, 2.741741180419922, 3.1034836769104004, 3.465226411819458, 3.8269689083099365, 4.188711166381836, 4.550454139709473, 4.912196636199951, 5.27393913269043, 5.635681629180908, 5.997424125671387, 6.359167098999023, 6.720909118652344, 7.0826520919799805, 7.444394588470459, 7.8061370849609375, 8.167879104614258, 8.529622077941895, 8.891364097595215, 9.253107070922852, 9.614849090576172, 9.976592063903809, 10.338335037231445, 10.700077056884766, 11.061820030212402]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 1.0, 8.0, 4.0, 5.0, 5.0, 5.0, 7.0, 9.0, 15.0, 20.0, 39.0, 71.0, 133.0, 227.0, 345.0, 493.0, 700.0, 1098.0, 1688.0, 2994.0, 5787.0, 11646.0, 24993.0, 60640.0, 1051251.0, 2896257.0, 79195.0, 28004.0, 13064.0, 7124.0, 3599.0, 1907.0, 1087.0, 647.0, 436.0, 320.0, 202.0, 97.0, 58.0, 20.0, 22.0, 12.0, 5.0, 8.0, 8.0, 2.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.36865234375, -0.35784149169921875, -0.3470306396484375, -0.33621978759765625, -0.325408935546875, -0.31459808349609375, -0.3037872314453125, -0.29297637939453125, -0.28216552734375, -0.27135467529296875, -0.2605438232421875, -0.24973297119140625, -0.238922119140625, -0.22811126708984375, -0.2173004150390625, -0.20648956298828125, -0.1956787109375, -0.18486785888671875, -0.1740570068359375, -0.16324615478515625, -0.152435302734375, -0.14162445068359375, -0.1308135986328125, -0.12000274658203125, -0.10919189453125, -0.09838104248046875, -0.0875701904296875, -0.07675933837890625, -0.065948486328125, -0.05513763427734375, -0.0443267822265625, -0.03351593017578125, -0.022705078125, -0.01189422607421875, -0.0010833740234375, 0.00972747802734375, 0.020538330078125, 0.03134918212890625, 0.0421600341796875, 0.05297088623046875, 0.06378173828125, 0.07459259033203125, 0.0854034423828125, 0.09621429443359375, 0.107025146484375, 0.11783599853515625, 0.1286468505859375, 0.13945770263671875, 0.1502685546875, 0.16107940673828125, 0.1718902587890625, 0.18270111083984375, 0.193511962890625, 0.20432281494140625, 0.2151336669921875, 0.22594451904296875, 0.23675537109375, 0.24756622314453125, 0.2583770751953125, 0.26918792724609375, 0.279998779296875, 0.29080963134765625, 0.3016204833984375, 0.31243133544921875, 0.3232421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 12.0, 7.0, 13.0, 21.0, 16.0, 22.0, 27.0, 35.0, 34.0, 38.0, 48.0, 51.0, 45.0, 54.0, 55.0, 70.0, 66.0, 62.0, 56.0, 43.0, 34.0, 29.0, 28.0, 14.0, 15.0, 14.0, 16.0, 17.0, 14.0, 4.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.08099365234375, -0.07858657836914062, -0.07617950439453125, -0.07377243041992188, -0.0713653564453125, -0.06895828247070312, -0.06655120849609375, -0.06414413452148438, -0.061737060546875, -0.059329986572265625, -0.05692291259765625, -0.054515838623046875, -0.0521087646484375, -0.049701690673828125, -0.04729461669921875, -0.044887542724609375, -0.04248046875, -0.040073394775390625, -0.03766632080078125, -0.035259246826171875, -0.0328521728515625, -0.030445098876953125, -0.02803802490234375, -0.025630950927734375, -0.023223876953125, -0.020816802978515625, -0.01840972900390625, -0.016002655029296875, -0.0135955810546875, -0.011188507080078125, -0.00878143310546875, -0.006374359130859375, -0.00396728515625, -0.001560211181640625, 0.00084686279296875, 0.003253936767578125, 0.0056610107421875, 0.008068084716796875, 0.01047515869140625, 0.012882232666015625, 0.015289306640625, 0.017696380615234375, 0.02010345458984375, 0.022510528564453125, 0.0249176025390625, 0.027324676513671875, 0.02973175048828125, 0.032138824462890625, 0.0345458984375, 0.036952972412109375, 0.03936004638671875, 0.041767120361328125, 0.0441741943359375, 0.046581268310546875, 0.04898834228515625, 0.051395416259765625, 0.053802490234375, 0.056209564208984375, 0.05861663818359375, 0.061023712158203125, 0.0634307861328125, 0.06583786010742188, 0.06824493408203125, 0.07065200805664062, 0.07305908203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 8.0, 10.0, 10.0, 23.0, 24.0, 23.0, 36.0, 55.0, 92.0, 489.0, 26703.0, 4161125.0, 5202.0, 191.0, 85.0, 35.0, 33.0, 24.0, 16.0, 16.0, 10.0, 8.0, 5.0, 12.0, 4.0, 4.0, 6.0, 1.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99560546875, -0.9657363891601562, -0.9358673095703125, -0.9059982299804688, -0.876129150390625, -0.8462600708007812, -0.8163909912109375, -0.7865219116210938, -0.75665283203125, -0.7267837524414062, -0.6969146728515625, -0.6670455932617188, -0.637176513671875, -0.6073074340820312, -0.5774383544921875, -0.5475692749023438, -0.5177001953125, -0.48783111572265625, -0.4579620361328125, -0.42809295654296875, -0.398223876953125, -0.36835479736328125, -0.3384857177734375, -0.30861663818359375, -0.27874755859375, -0.24887847900390625, -0.2190093994140625, -0.18914031982421875, -0.159271240234375, -0.12940216064453125, -0.0995330810546875, -0.06966400146484375, -0.039794921875, -0.00992584228515625, 0.0199432373046875, 0.04981231689453125, 0.079681396484375, 0.10955047607421875, 0.1394195556640625, 0.16928863525390625, 0.19915771484375, 0.22902679443359375, 0.2588958740234375, 0.28876495361328125, 0.318634033203125, 0.34850311279296875, 0.3783721923828125, 0.40824127197265625, 0.4381103515625, 0.46797943115234375, 0.4978485107421875, 0.5277175903320312, 0.557586669921875, 0.5874557495117188, 0.6173248291015625, 0.6471939086914062, 0.67706298828125, 0.7069320678710938, 0.7368011474609375, 0.7666702270507812, 0.796539306640625, 0.8264083862304688, 0.8562774658203125, 0.8861465454101562, 0.916015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 3.0, 4.0, 8.0, 9.0, 5.0, 8.0, 16.0, 11.0, 22.0, 27.0, 33.0, 51.0, 90.0, 176.0, 866.0, 1922.0, 416.0, 141.0, 65.0, 44.0, 36.0, 17.0, 26.0, 19.0, 11.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2088623046875, -0.2019634246826172, -0.19506454467773438, -0.18816566467285156, -0.18126678466796875, -0.17436790466308594, -0.16746902465820312, -0.1605701446533203, -0.1536712646484375, -0.1467723846435547, -0.13987350463867188, -0.13297462463378906, -0.12607574462890625, -0.11917686462402344, -0.11227798461914062, -0.10537910461425781, -0.098480224609375, -0.09158134460449219, -0.08468246459960938, -0.07778358459472656, -0.07088470458984375, -0.06398582458496094, -0.057086944580078125, -0.05018806457519531, -0.0432891845703125, -0.03639030456542969, -0.029491424560546875, -0.022592544555664062, -0.01569366455078125, -0.008794784545898438, -0.001895904541015625, 0.0050029754638671875, 0.01190185546875, 0.018800735473632812, 0.025699615478515625, 0.03259849548339844, 0.03949737548828125, 0.04639625549316406, 0.053295135498046875, 0.06019401550292969, 0.0670928955078125, 0.07399177551269531, 0.08089065551757812, 0.08778953552246094, 0.09468841552734375, 0.10158729553222656, 0.10848617553710938, 0.11538505554199219, 0.122283935546875, 0.1291828155517578, 0.13608169555664062, 0.14298057556152344, 0.14987945556640625, 0.15677833557128906, 0.16367721557617188, 0.1705760955810547, 0.1774749755859375, 0.1843738555908203, 0.19127273559570312, 0.19817161560058594, 0.20507049560546875, 0.21196937561035156, 0.21886825561523438, 0.2257671356201172, 0.232666015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 9.0, 11.0, 22.0, 35.0, 78.0, 156.0, 249.0, 226.0, 104.0, 49.0, 30.0, 17.0, 5.0, 6.0, 4.0, 4.0, 1.0], "bins": [-0.5707597732543945, -0.5601474046707153, -0.5495350956916809, -0.5389227271080017, -0.5283104181289673, -0.5176980495452881, -0.5070857405662537, -0.49647337198257446, -0.48586103320121765, -0.47524869441986084, -0.46463635563850403, -0.4540240168571472, -0.443411648273468, -0.4327993094921112, -0.4221869707107544, -0.4115746319293976, -0.40096229314804077, -0.39034995436668396, -0.37973761558532715, -0.36912527680397034, -0.3585129380226135, -0.3479005694389343, -0.3372882306575775, -0.3266758918762207, -0.3160635530948639, -0.3054512143135071, -0.29483887553215027, -0.28422653675079346, -0.27361416816711426, -0.26300182938575745, -0.25238949060440063, -0.24177715182304382, -0.231164813041687, -0.2205524742603302, -0.2099401354789734, -0.19932778179645538, -0.18871544301509857, -0.17810310423374176, -0.16749075055122375, -0.15687841176986694, -0.14626607298851013, -0.13565373420715332, -0.1250413954257965, -0.1144290417432785, -0.10381670296192169, -0.09320436418056488, -0.08259201794862747, -0.07197967171669006, -0.06136733293533325, -0.05075499042868614, -0.04014264792203903, -0.029530305415391922, -0.018917962908744812, -0.008305620402097702, 0.002306722104549408, 0.012919068336486816, 0.023531407117843628, 0.03414374962449074, 0.04475609213113785, 0.05536843463778496, 0.06598077714443207, 0.07659311592578888, 0.08720546215772629, 0.0978178083896637, 0.10843014717102051]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 8.0, 12.0, 12.0, 15.0, 20.0, 23.0, 25.0, 39.0, 38.0, 48.0, 55.0, 59.0, 57.0, 75.0, 62.0, 68.0, 63.0, 61.0, 55.0, 43.0, 21.0, 22.0, 31.0, 21.0, 14.0, 13.0, 10.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.45400798320770264, -0.43871253728866577, -0.4234170913696289, -0.40812167525291443, -0.39282622933387756, -0.3775307834148407, -0.3622353672981262, -0.34693992137908936, -0.3316444754600525, -0.3163490295410156, -0.30105358362197876, -0.2857581675052643, -0.2704627215862274, -0.25516727566719055, -0.23987184464931488, -0.2245764136314392, -0.20928096771240234, -0.19398552179336548, -0.1786900907754898, -0.16339465975761414, -0.14809921383857727, -0.1328037679195404, -0.11750833690166473, -0.10221289843320847, -0.0869174599647522, -0.07162202149629593, -0.05632658302783966, -0.04103114455938339, -0.025735706090927124, -0.010440267622470856, 0.004855170845985413, 0.02015060931444168, 0.03544604778289795, 0.05074148625135422, 0.06603692471981049, 0.08133236318826675, 0.09662780165672302, 0.11192324012517929, 0.12721867859363556, 0.14251410961151123, 0.1578095555305481, 0.17310500144958496, 0.18840043246746063, 0.2036958634853363, 0.21899130940437317, 0.23428675532341003, 0.2495821863412857, 0.2648776173591614, 0.28017306327819824, 0.2954685091972351, 0.310763955116272, 0.32605937123298645, 0.3413548171520233, 0.3566502630710602, 0.37194567918777466, 0.3872411251068115, 0.4025365710258484, 0.41783201694488525, 0.4331274628639221, 0.4484228789806366, 0.46371832489967346, 0.4790137708187103, 0.4943091869354248, 0.5096046328544617, 0.5249000787734985]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 4.0, 11.0, 12.0, 22.0, 22.0, 52.0, 58.0, 83.0, 133.0, 156.0, 241.0, 352.0, 581.0, 995.0, 1597.0, 3050.0, 6680.0, 17417.0, 82462.0, 824674.0, 79222.0, 16798.0, 6497.0, 3081.0, 1654.0, 988.0, 580.0, 331.0, 229.0, 150.0, 117.0, 84.0, 42.0, 53.0, 30.0, 11.0, 20.0, 13.0, 7.0, 5.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.1328125, -1.0979461669921875, -1.063079833984375, -1.0282135009765625, -0.99334716796875, -0.9584808349609375, -0.923614501953125, -0.8887481689453125, -0.8538818359375, -0.8190155029296875, -0.784149169921875, -0.7492828369140625, -0.71441650390625, -0.6795501708984375, -0.644683837890625, -0.6098175048828125, -0.574951171875, -0.5400848388671875, -0.505218505859375, -0.4703521728515625, -0.43548583984375, -0.4006195068359375, -0.365753173828125, -0.3308868408203125, -0.2960205078125, -0.2611541748046875, -0.226287841796875, -0.1914215087890625, -0.15655517578125, -0.1216888427734375, -0.086822509765625, -0.0519561767578125, -0.01708984375, 0.0177764892578125, 0.052642822265625, 0.0875091552734375, 0.12237548828125, 0.1572418212890625, 0.192108154296875, 0.2269744873046875, 0.2618408203125, 0.2967071533203125, 0.331573486328125, 0.3664398193359375, 0.40130615234375, 0.4361724853515625, 0.471038818359375, 0.5059051513671875, 0.540771484375, 0.5756378173828125, 0.610504150390625, 0.6453704833984375, 0.68023681640625, 0.7151031494140625, 0.749969482421875, 0.7848358154296875, 0.8197021484375, 0.8545684814453125, 0.889434814453125, 0.9243011474609375, 0.95916748046875, 0.9940338134765625, 1.028900146484375, 1.0637664794921875, 1.0986328125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 0.0, 3.0, 10.0, 14.0, 13.0, 17.0, 14.0, 25.0, 27.0, 42.0, 31.0, 32.0, 58.0, 36.0, 45.0, 62.0, 63.0, 65.0, 58.0, 62.0, 53.0, 41.0, 32.0, 27.0, 26.0, 21.0, 14.0, 16.0, 14.0, 18.0, 14.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07208251953125, -0.06980037689208984, -0.06751823425292969, -0.06523609161376953, -0.06295394897460938, -0.06067180633544922, -0.05838966369628906, -0.056107521057128906, -0.05382537841796875, -0.051543235778808594, -0.04926109313964844, -0.04697895050048828, -0.044696807861328125, -0.04241466522216797, -0.04013252258300781, -0.037850379943847656, -0.0355682373046875, -0.033286094665527344, -0.031003952026367188, -0.02872180938720703, -0.026439666748046875, -0.02415752410888672, -0.021875381469726562, -0.019593238830566406, -0.01731109619140625, -0.015028953552246094, -0.012746810913085938, -0.010464668273925781, -0.008182525634765625, -0.005900382995605469, -0.0036182403564453125, -0.0013360977172851562, 0.000946044921875, 0.0032281875610351562, 0.0055103302001953125, 0.007792472839355469, 0.010074615478515625, 0.012356758117675781, 0.014638900756835938, 0.016921043395996094, 0.01920318603515625, 0.021485328674316406, 0.023767471313476562, 0.02604961395263672, 0.028331756591796875, 0.03061389923095703, 0.03289604187011719, 0.035178184509277344, 0.0374603271484375, 0.039742469787597656, 0.04202461242675781, 0.04430675506591797, 0.046588897705078125, 0.04887104034423828, 0.05115318298339844, 0.053435325622558594, 0.05571746826171875, 0.057999610900878906, 0.06028175354003906, 0.06256389617919922, 0.06484603881835938, 0.06712818145751953, 0.06941032409667969, 0.07169246673583984, 0.073974609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 9.0, 11.0, 10.0, 15.0, 12.0, 23.0, 30.0, 37.0, 39.0, 67.0, 83.0, 113.0, 186.0, 254.0, 382.0, 538.0, 870.0, 1444.0, 2514.0, 4521.0, 9643.0, 23277.0, 68735.0, 317441.0, 471623.0, 92963.0, 29100.0, 11709.0, 5553.0, 2842.0, 1557.0, 943.0, 625.0, 389.0, 275.0, 186.0, 141.0, 104.0, 72.0, 55.0, 44.0, 37.0, 21.0, 9.0, 13.0, 11.0, 8.0, 9.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2743377685546875, -0.265228271484375, -0.2561187744140625, -0.24700927734375, -0.2378997802734375, -0.228790283203125, -0.2196807861328125, -0.2105712890625, -0.2014617919921875, -0.192352294921875, -0.1832427978515625, -0.17413330078125, -0.1650238037109375, -0.155914306640625, -0.1468048095703125, -0.1376953125, -0.1285858154296875, -0.119476318359375, -0.1103668212890625, -0.10125732421875, -0.0921478271484375, -0.083038330078125, -0.0739288330078125, -0.0648193359375, -0.0557098388671875, -0.046600341796875, -0.0374908447265625, -0.02838134765625, -0.0192718505859375, -0.010162353515625, -0.0010528564453125, 0.008056640625, 0.0171661376953125, 0.026275634765625, 0.0353851318359375, 0.04449462890625, 0.0536041259765625, 0.062713623046875, 0.0718231201171875, 0.0809326171875, 0.0900421142578125, 0.099151611328125, 0.1082611083984375, 0.11737060546875, 0.1264801025390625, 0.135589599609375, 0.1446990966796875, 0.15380859375, 0.1629180908203125, 0.172027587890625, 0.1811370849609375, 0.19024658203125, 0.1993560791015625, 0.208465576171875, 0.2175750732421875, 0.2266845703125, 0.2357940673828125, 0.244903564453125, 0.2540130615234375, 0.26312255859375, 0.2722320556640625, 0.281341552734375, 0.2904510498046875, 0.299560546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 13.0, 7.0, 7.0, 11.0, 15.0, 11.0, 29.0, 31.0, 27.0, 26.0, 33.0, 30.0, 40.0, 51.0, 40.0, 30.0, 44.0, 48.0, 45.0, 37.0, 37.0, 43.0, 39.0, 30.0, 28.0, 32.0, 32.0, 23.0, 19.0, 24.0, 15.0, 18.0, 11.0, 10.0, 10.0, 5.0, 9.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1739501953125, -0.16814231872558594, -0.16233444213867188, -0.1565265655517578, -0.15071868896484375, -0.1449108123779297, -0.13910293579101562, -0.13329505920410156, -0.1274871826171875, -0.12167930603027344, -0.11587142944335938, -0.11006355285644531, -0.10425567626953125, -0.09844779968261719, -0.09263992309570312, -0.08683204650878906, -0.081024169921875, -0.07521629333496094, -0.06940841674804688, -0.06360054016113281, -0.05779266357421875, -0.05198478698730469, -0.046176910400390625, -0.04036903381347656, -0.0345611572265625, -0.028753280639648438, -0.022945404052734375, -0.017137527465820312, -0.01132965087890625, -0.0055217742919921875, 0.000286102294921875, 0.0060939788818359375, 0.01190185546875, 0.017709732055664062, 0.023517608642578125, 0.029325485229492188, 0.03513336181640625, 0.04094123840332031, 0.046749114990234375, 0.05255699157714844, 0.0583648681640625, 0.06417274475097656, 0.06998062133789062, 0.07578849792480469, 0.08159637451171875, 0.08740425109863281, 0.09321212768554688, 0.09902000427246094, 0.104827880859375, 0.11063575744628906, 0.11644363403320312, 0.12225151062011719, 0.12805938720703125, 0.1338672637939453, 0.13967514038085938, 0.14548301696777344, 0.1512908935546875, 0.15709877014160156, 0.16290664672851562, 0.1687145233154297, 0.17452239990234375, 0.1803302764892578, 0.18613815307617188, 0.19194602966308594, 0.19775390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 8.0, 6.0, 22.0, 9.0, 28.0, 38.0, 42.0, 69.0, 98.0, 132.0, 215.0, 375.0, 633.0, 1188.0, 2575.0, 6413.0, 22891.0, 828161.0, 160166.0, 15902.0, 4966.0, 2061.0, 1019.0, 556.0, 351.0, 186.0, 141.0, 89.0, 72.0, 30.0, 36.0, 15.0, 16.0, 8.0, 10.0, 4.0, 4.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20458984375, -0.19817161560058594, -0.19175338745117188, -0.1853351593017578, -0.17891693115234375, -0.1724987030029297, -0.16608047485351562, -0.15966224670410156, -0.1532440185546875, -0.14682579040527344, -0.14040756225585938, -0.1339893341064453, -0.12757110595703125, -0.12115287780761719, -0.11473464965820312, -0.10831642150878906, -0.101898193359375, -0.09547996520996094, -0.08906173706054688, -0.08264350891113281, -0.07622528076171875, -0.06980705261230469, -0.06338882446289062, -0.05697059631347656, -0.0505523681640625, -0.04413414001464844, -0.037715911865234375, -0.03129768371582031, -0.02487945556640625, -0.018461227416992188, -0.012042999267578125, -0.0056247711181640625, 0.00079345703125, 0.0072116851806640625, 0.013629913330078125, 0.020048141479492188, 0.02646636962890625, 0.03288459777832031, 0.039302825927734375, 0.04572105407714844, 0.0521392822265625, 0.05855751037597656, 0.06497573852539062, 0.07139396667480469, 0.07781219482421875, 0.08423042297363281, 0.09064865112304688, 0.09706687927246094, 0.103485107421875, 0.10990333557128906, 0.11632156372070312, 0.12273979187011719, 0.12915802001953125, 0.1355762481689453, 0.14199447631835938, 0.14841270446777344, 0.1548309326171875, 0.16124916076660156, 0.16766738891601562, 0.1740856170654297, 0.18050384521484375, 0.1869220733642578, 0.19334030151367188, 0.19975852966308594, 0.2061767578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 10.0, 5.0, 20.0, 97.0, 463.0, 301.0, 50.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8100948333740234e-05, -4.663597792387009e-05, -4.517100751399994e-05, -4.370603710412979e-05, -4.2241066694259644e-05, -4.0776096284389496e-05, -3.931112587451935e-05, -3.78461554646492e-05, -3.638118505477905e-05, -3.4916214644908905e-05, -3.345124423503876e-05, -3.198627382516861e-05, -3.052130341529846e-05, -2.9056333005428314e-05, -2.7591362595558167e-05, -2.612639218568802e-05, -2.466142177581787e-05, -2.3196451365947723e-05, -2.1731480956077576e-05, -2.0266510546207428e-05, -1.880154013633728e-05, -1.7336569726467133e-05, -1.5871599316596985e-05, -1.4406628906726837e-05, -1.294165849685669e-05, -1.1476688086986542e-05, -1.0011717677116394e-05, -8.546747267246246e-06, -7.081776857376099e-06, -5.616806447505951e-06, -4.151836037635803e-06, -2.6868656277656555e-06, -1.2218952178955078e-06, 2.430751919746399e-07, 1.7080456018447876e-06, 3.1730160117149353e-06, 4.637986421585083e-06, 6.102956831455231e-06, 7.567927241325378e-06, 9.032897651195526e-06, 1.0497868061065674e-05, 1.1962838470935822e-05, 1.342780888080597e-05, 1.4892779290676117e-05, 1.6357749700546265e-05, 1.7822720110416412e-05, 1.928769052028656e-05, 2.0752660930156708e-05, 2.2217631340026855e-05, 2.3682601749897003e-05, 2.514757215976715e-05, 2.66125425696373e-05, 2.8077512979507446e-05, 2.9542483389377594e-05, 3.100745379924774e-05, 3.247242420911789e-05, 3.393739461898804e-05, 3.5402365028858185e-05, 3.686733543872833e-05, 3.833230584859848e-05, 3.979727625846863e-05, 4.1262246668338776e-05, 4.272721707820892e-05, 4.419218748807907e-05, 4.565715789794922e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 4.0, 4.0, 11.0, 9.0, 26.0, 34.0, 77.0, 223.0, 581.0, 1736.0, 6179.0, 29638.0, 950591.0, 47372.0, 8553.0, 2286.0, 715.0, 278.0, 106.0, 50.0, 15.0, 19.0, 10.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.53564453125, -0.5206031799316406, -0.5055618286132812, -0.4905204772949219, -0.4754791259765625, -0.4604377746582031, -0.44539642333984375, -0.4303550720214844, -0.415313720703125, -0.4002723693847656, -0.38523101806640625, -0.3701896667480469, -0.3551483154296875, -0.3401069641113281, -0.32506561279296875, -0.3100242614746094, -0.29498291015625, -0.2799415588378906, -0.26490020751953125, -0.24985885620117188, -0.2348175048828125, -0.21977615356445312, -0.20473480224609375, -0.18969345092773438, -0.174652099609375, -0.15961074829101562, -0.14456939697265625, -0.12952804565429688, -0.1144866943359375, -0.09944534301757812, -0.08440399169921875, -0.06936264038085938, -0.0543212890625, -0.039279937744140625, -0.02423858642578125, -0.009197235107421875, 0.0058441162109375, 0.020885467529296875, 0.03592681884765625, 0.050968170166015625, 0.066009521484375, 0.08105087280273438, 0.09609222412109375, 0.11113357543945312, 0.1261749267578125, 0.14121627807617188, 0.15625762939453125, 0.17129898071289062, 0.18634033203125, 0.20138168334960938, 0.21642303466796875, 0.23146438598632812, 0.2465057373046875, 0.2615470886230469, 0.27658843994140625, 0.2916297912597656, 0.306671142578125, 0.3217124938964844, 0.33675384521484375, 0.3517951965332031, 0.3668365478515625, 0.3818778991699219, 0.39691925048828125, 0.4119606018066406, 0.427001953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 10.0, 11.0, 6.0, 6.0, 7.0, 15.0, 23.0, 31.0, 115.0, 420.0, 172.0, 48.0, 25.0, 10.0, 12.0, 10.0, 4.0, 8.0, 10.0, 4.0, 7.0, 8.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.297821044921875, -0.28778076171875, -0.277740478515625, -0.2677001953125, -0.257659912109375, -0.24761962890625, -0.237579345703125, -0.2275390625, -0.217498779296875, -0.20745849609375, -0.197418212890625, -0.1873779296875, -0.177337646484375, -0.16729736328125, -0.157257080078125, -0.147216796875, -0.137176513671875, -0.12713623046875, -0.117095947265625, -0.1070556640625, -0.097015380859375, -0.08697509765625, -0.076934814453125, -0.06689453125, -0.056854248046875, -0.04681396484375, -0.036773681640625, -0.0267333984375, -0.016693115234375, -0.00665283203125, 0.003387451171875, 0.013427734375, 0.023468017578125, 0.03350830078125, 0.043548583984375, 0.0535888671875, 0.063629150390625, 0.07366943359375, 0.083709716796875, 0.09375, 0.103790283203125, 0.11383056640625, 0.123870849609375, 0.1339111328125, 0.143951416015625, 0.15399169921875, 0.164031982421875, 0.174072265625, 0.184112548828125, 0.19415283203125, 0.204193115234375, 0.2142333984375, 0.224273681640625, 0.23431396484375, 0.244354248046875, 0.25439453125, 0.264434814453125, 0.27447509765625, 0.284515380859375, 0.2945556640625, 0.304595947265625, 0.31463623046875, 0.324676513671875, 0.334716796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 18.0, 75.0, 472.0, 361.0, 67.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8925241231918335, -1.7027668952941895, -1.5130096673965454, -1.3232524394989014, -1.1334953308105469, -0.9437380433082581, -0.7539808750152588, -0.5642236471176147, -0.3744664192199707, -0.18470920622348785, 0.005048006772994995, 0.19480520486831665, 0.3845624327659607, 0.5743196606636047, 0.764076828956604, 0.953834056854248, 1.143591284751892, 1.3333485126495361, 1.5231057405471802, 1.7128629684448242, 1.9026200771331787, 2.0923774242401123, 2.282134532928467, 2.4718918800354004, 2.661648988723755, 2.8514060974121094, 3.041163444519043, 3.2309205532073975, 3.420677900314331, 3.6104350090026855, 3.800192356109619, 3.9899494647979736, 4.179707050323486, 4.36946439743042, 4.559221267700195, 4.748978614807129, 4.9387359619140625, 5.128493309020996, 5.3182501792907715, 5.508007526397705, 5.697764873504639, 5.887522220611572, 6.077279090881348, 6.267036437988281, 6.456793785095215, 6.646551132202148, 6.836308002471924, 7.026065349578857, 7.215822219848633, 7.405579566955566, 7.595336437225342, 7.785093784332275, 7.974851131439209, 8.164608001708984, 8.354365348815918, 8.544122695922852, 8.733880043029785, 8.923637390136719, 9.113394737243652, 9.303152084350586, 9.492908477783203, 9.682665824890137, 9.87242317199707, 10.062180519104004, 10.251937866210938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 6.0, 8.0, 15.0, 12.0, 11.0, 13.0, 21.0, 18.0, 30.0, 26.0, 35.0, 37.0, 39.0, 48.0, 46.0, 43.0, 47.0, 60.0, 61.0, 51.0, 45.0, 39.0, 43.0, 37.0, 37.0, 26.0, 29.0, 17.0, 23.0, 13.0, 18.0, 10.0, 7.0, 5.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8509693145751953, -0.8158197402954102, -0.7806701064109802, -0.7455205321311951, -0.7103708982467651, -0.67522132396698, -0.6400717496871948, -0.6049221754074097, -0.5697725415229797, -0.5346229672431946, -0.49947333335876465, -0.4643237590789795, -0.42917415499687195, -0.3940245509147644, -0.35887497663497925, -0.3237253725528717, -0.28857576847076416, -0.2534261643886566, -0.21827657520771027, -0.18312698602676392, -0.14797738194465637, -0.11282777786254883, -0.07767818868160248, -0.04252859950065613, -0.007378995418548584, 0.027770601212978363, 0.06292019784450531, 0.09806979447603226, 0.1332193911075592, 0.16836899518966675, 0.2035185843706131, 0.23866817355155945, 0.27381789684295654, 0.3089675009250641, 0.34411710500717163, 0.3792666792869568, 0.41441628336906433, 0.4495658874511719, 0.48471546173095703, 0.5198650360107422, 0.5550146698951721, 0.5901642441749573, 0.6253138780593872, 0.6604634523391724, 0.6956130266189575, 0.7307626605033875, 0.7659122347831726, 0.8010618686676025, 0.8362114429473877, 0.8713610172271729, 0.9065106511116028, 0.9416602253913879, 0.9768098592758179, 1.011959433555603, 1.0471090078353882, 1.0822585821151733, 1.117408275604248, 1.1525578498840332, 1.1877074241638184, 1.222857117652893, 1.2580066919326782, 1.2931562662124634, 1.3283058404922485, 1.3634554147720337, 1.3986049890518188]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 9.0, 12.0, 11.0, 12.0, 11.0, 19.0, 33.0, 56.0, 59.0, 100.0, 129.0, 211.0, 360.0, 674.0, 1549.0, 3857.0, 14757.0, 140030.0, 3978899.0, 40990.0, 7699.0, 2391.0, 1021.0, 539.0, 296.0, 175.0, 104.0, 96.0, 58.0, 27.0, 25.0, 14.0, 11.0, 10.0, 10.0, 13.0, 1.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56640625, -0.5463790893554688, -0.5263519287109375, -0.5063247680664062, -0.486297607421875, -0.46627044677734375, -0.4462432861328125, -0.42621612548828125, -0.40618896484375, -0.38616180419921875, -0.3661346435546875, -0.34610748291015625, -0.326080322265625, -0.30605316162109375, -0.2860260009765625, -0.26599884033203125, -0.2459716796875, -0.22594451904296875, -0.2059173583984375, -0.18589019775390625, -0.165863037109375, -0.14583587646484375, -0.1258087158203125, -0.10578155517578125, -0.08575439453125, -0.06572723388671875, -0.0457000732421875, -0.02567291259765625, -0.005645751953125, 0.01438140869140625, 0.0344085693359375, 0.05443572998046875, 0.074462890625, 0.09449005126953125, 0.1145172119140625, 0.13454437255859375, 0.154571533203125, 0.17459869384765625, 0.1946258544921875, 0.21465301513671875, 0.23468017578125, 0.25470733642578125, 0.2747344970703125, 0.29476165771484375, 0.314788818359375, 0.33481597900390625, 0.3548431396484375, 0.37487030029296875, 0.3948974609375, 0.41492462158203125, 0.4349517822265625, 0.45497894287109375, 0.475006103515625, 0.49503326416015625, 0.5150604248046875, 0.5350875854492188, 0.55511474609375, 0.5751419067382812, 0.5951690673828125, 0.6151962280273438, 0.635223388671875, 0.6552505493164062, 0.6752777099609375, 0.6953048706054688, 0.71533203125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 1.0, 8.0, 5.0, 13.0, 11.0, 13.0, 17.0, 18.0, 20.0, 35.0, 29.0, 37.0, 48.0, 42.0, 50.0, 49.0, 63.0, 61.0, 55.0, 52.0, 56.0, 39.0, 31.0, 29.0, 40.0, 30.0, 16.0, 26.0, 15.0, 15.0, 18.0, 9.0, 7.0, 11.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06427001953125, -0.062091827392578125, -0.05991363525390625, -0.057735443115234375, -0.0555572509765625, -0.053379058837890625, -0.05120086669921875, -0.049022674560546875, -0.046844482421875, -0.044666290283203125, -0.04248809814453125, -0.040309906005859375, -0.0381317138671875, -0.035953521728515625, -0.03377532958984375, -0.031597137451171875, -0.0294189453125, -0.027240753173828125, -0.02506256103515625, -0.022884368896484375, -0.0207061767578125, -0.018527984619140625, -0.01634979248046875, -0.014171600341796875, -0.011993408203125, -0.009815216064453125, -0.00763702392578125, -0.005458831787109375, -0.0032806396484375, -0.001102447509765625, 0.00107574462890625, 0.003253936767578125, 0.00543212890625, 0.007610321044921875, 0.00978851318359375, 0.011966705322265625, 0.0141448974609375, 0.016323089599609375, 0.01850128173828125, 0.020679473876953125, 0.022857666015625, 0.025035858154296875, 0.02721405029296875, 0.029392242431640625, 0.0315704345703125, 0.033748626708984375, 0.03592681884765625, 0.038105010986328125, 0.040283203125, 0.042461395263671875, 0.04463958740234375, 0.046817779541015625, 0.0489959716796875, 0.051174163818359375, 0.05335235595703125, 0.055530548095703125, 0.057708740234375, 0.059886932373046875, 0.06206512451171875, 0.06424331665039062, 0.0664215087890625, 0.06859970092773438, 0.07077789306640625, 0.07295608520507812, 0.07513427734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 10.0, 10.0, 5.0, 13.0, 26.0, 33.0, 110.0, 220.0, 662.0, 2828.0, 25719.0, 3965466.0, 188124.0, 8961.0, 1407.0, 389.0, 134.0, 66.0, 33.0, 21.0, 14.0, 11.0, 8.0, 4.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.8168792724609375, -0.791961669921875, -0.7670440673828125, -0.74212646484375, -0.7172088623046875, -0.692291259765625, -0.6673736572265625, -0.6424560546875, -0.6175384521484375, -0.592620849609375, -0.5677032470703125, -0.54278564453125, -0.5178680419921875, -0.492950439453125, -0.4680328369140625, -0.443115234375, -0.4181976318359375, -0.393280029296875, -0.3683624267578125, -0.34344482421875, -0.3185272216796875, -0.293609619140625, -0.2686920166015625, -0.2437744140625, -0.2188568115234375, -0.193939208984375, -0.1690216064453125, -0.14410400390625, -0.1191864013671875, -0.094268798828125, -0.0693511962890625, -0.04443359375, -0.0195159912109375, 0.005401611328125, 0.0303192138671875, 0.05523681640625, 0.0801544189453125, 0.105072021484375, 0.1299896240234375, 0.1549072265625, 0.1798248291015625, 0.204742431640625, 0.2296600341796875, 0.25457763671875, 0.2794952392578125, 0.304412841796875, 0.3293304443359375, 0.354248046875, 0.3791656494140625, 0.404083251953125, 0.4290008544921875, 0.45391845703125, 0.4788360595703125, 0.503753662109375, 0.5286712646484375, 0.5535888671875, 0.5785064697265625, 0.603424072265625, 0.6283416748046875, 0.65325927734375, 0.6781768798828125, 0.703094482421875, 0.7280120849609375, 0.7529296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 7.0, 9.0, 12.0, 9.0, 14.0, 15.0, 29.0, 24.0, 32.0, 72.0, 82.0, 150.0, 734.0, 1956.0, 526.0, 130.0, 85.0, 39.0, 40.0, 28.0, 28.0, 10.0, 6.0, 14.0, 4.0, 7.0, 9.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.15076637268066406, -0.14564895629882812, -0.1405315399169922, -0.13541412353515625, -0.1302967071533203, -0.12517929077148438, -0.12006187438964844, -0.1149444580078125, -0.10982704162597656, -0.10470962524414062, -0.09959220886230469, -0.09447479248046875, -0.08935737609863281, -0.08423995971679688, -0.07912254333496094, -0.074005126953125, -0.06888771057128906, -0.06377029418945312, -0.05865287780761719, -0.05353546142578125, -0.04841804504394531, -0.043300628662109375, -0.03818321228027344, -0.0330657958984375, -0.027948379516601562, -0.022830963134765625, -0.017713546752929688, -0.01259613037109375, -0.0074787139892578125, -0.002361297607421875, 0.0027561187744140625, 0.00787353515625, 0.012990951538085938, 0.018108367919921875, 0.023225784301757812, 0.02834320068359375, 0.03346061706542969, 0.038578033447265625, 0.04369544982910156, 0.0488128662109375, 0.05393028259277344, 0.059047698974609375, 0.06416511535644531, 0.06928253173828125, 0.07439994812011719, 0.07951736450195312, 0.08463478088378906, 0.089752197265625, 0.09486961364746094, 0.09998703002929688, 0.10510444641113281, 0.11022186279296875, 0.11533927917480469, 0.12045669555664062, 0.12557411193847656, 0.1306915283203125, 0.13580894470214844, 0.14092636108398438, 0.1460437774658203, 0.15116119384765625, 0.1562786102294922, 0.16139602661132812, 0.16651344299316406, 0.171630859375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 11.0, 19.0, 36.0, 63.0, 83.0, 151.0, 177.0, 168.0, 112.0, 71.0, 33.0, 30.0, 16.0, 17.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2656150460243225, -0.25055819749832153, -0.23550133407115936, -0.2204444706439972, -0.20538762211799622, -0.19033077359199524, -0.17527391016483307, -0.1602170467376709, -0.14516019821166992, -0.13010334968566895, -0.11504648625850677, -0.0999896302819252, -0.08493277430534363, -0.06987591832876205, -0.05481906235218048, -0.03976220637559891, -0.024705350399017334, -0.00964849442243576, 0.005408361554145813, 0.020465217530727386, 0.03552207350730896, 0.05057892948389053, 0.0656357854604721, 0.08069264143705368, 0.09574949741363525, 0.11080635339021683, 0.1258632093667984, 0.14092007279396057, 0.15597692131996155, 0.17103376984596252, 0.1860906332731247, 0.20114749670028687, 0.21620434522628784, 0.23126119375228882, 0.246318057179451, 0.26137492060661316, 0.27643176913261414, 0.2914886176586151, 0.3065454959869385, 0.32160234451293945, 0.33665919303894043, 0.3517160415649414, 0.3667728900909424, 0.38182976841926575, 0.3968866169452667, 0.4119434654712677, 0.42700034379959106, 0.44205719232559204, 0.457114040851593, 0.472170889377594, 0.48722773790359497, 0.502284586429596, 0.5173414945602417, 0.5323983430862427, 0.5474551916122437, 0.5625120401382446, 0.5775688886642456, 0.5926257371902466, 0.6076825857162476, 0.6227394342422485, 0.6377962827682495, 0.6528531908988953, 0.6679100394248962, 0.6829668879508972, 0.6980237364768982]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 9.0, 5.0, 7.0, 8.0, 19.0, 19.0, 30.0, 37.0, 26.0, 47.0, 48.0, 52.0, 58.0, 67.0, 49.0, 60.0, 58.0, 51.0, 56.0, 43.0, 56.0, 31.0, 41.0, 19.0, 25.0, 20.0, 8.0, 19.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.5101990103721619, -0.49831050634384155, -0.48642200231552124, -0.4745334982872009, -0.4626449942588806, -0.4507564902305603, -0.43886798620224, -0.4269794821739197, -0.41509097814559937, -0.40320247411727905, -0.39131397008895874, -0.3794254660606384, -0.3675369620323181, -0.3556484580039978, -0.3437599539756775, -0.3318714499473572, -0.31998294591903687, -0.30809444189071655, -0.29620593786239624, -0.2843174338340759, -0.2724289298057556, -0.2605404257774353, -0.248651921749115, -0.23676341772079468, -0.22487488389015198, -0.21298637986183167, -0.20109787583351135, -0.18920937180519104, -0.17732086777687073, -0.16543236374855042, -0.1535438597202301, -0.1416553556919098, -0.12976685166358948, -0.11787834763526917, -0.10598984360694885, -0.09410133957862854, -0.08221283555030823, -0.07032433152198792, -0.058435820043087006, -0.04654731601476669, -0.03465881198644638, -0.022770307958126068, -0.010881802067160606, 0.0010067038238048553, 0.012895207852125168, 0.02478371188044548, 0.03667221963405609, 0.048560723662376404, 0.060449227690696716, 0.07233773171901703, 0.08422623574733734, 0.09611473977565765, 0.10800324380397797, 0.11989174783229828, 0.13178026676177979, 0.1436687707901001, 0.1555572748184204, 0.16744577884674072, 0.17933428287506104, 0.19122278690338135, 0.20311129093170166, 0.21499979496002197, 0.22688829898834229, 0.2387768030166626, 0.2506653070449829]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 9.0, 13.0, 19.0, 24.0, 44.0, 73.0, 83.0, 124.0, 198.0, 310.0, 488.0, 733.0, 1113.0, 1714.0, 2804.0, 4645.0, 7836.0, 13278.0, 23440.0, 44007.0, 89685.0, 214688.0, 340536.0, 152903.0, 68181.0, 34784.0, 19228.0, 10849.0, 6404.0, 3859.0, 2214.0, 1453.0, 943.0, 618.0, 438.0, 276.0, 174.0, 135.0, 85.0, 54.0, 36.0, 22.0, 12.0, 5.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.257568359375, -0.2500629425048828, -0.24255752563476562, -0.23505210876464844, -0.22754669189453125, -0.22004127502441406, -0.21253585815429688, -0.2050304412841797, -0.1975250244140625, -0.1900196075439453, -0.18251419067382812, -0.17500877380371094, -0.16750335693359375, -0.15999794006347656, -0.15249252319335938, -0.1449871063232422, -0.137481689453125, -0.1299762725830078, -0.12247085571289062, -0.11496543884277344, -0.10746002197265625, -0.09995460510253906, -0.09244918823242188, -0.08494377136230469, -0.0774383544921875, -0.06993293762207031, -0.062427520751953125, -0.05492210388183594, -0.04741668701171875, -0.03991127014160156, -0.032405853271484375, -0.024900436401367188, -0.01739501953125, -0.009889602661132812, -0.002384185791015625, 0.0051212310791015625, 0.01262664794921875, 0.020132064819335938, 0.027637481689453125, 0.03514289855957031, 0.0426483154296875, 0.05015373229980469, 0.057659149169921875, 0.06516456604003906, 0.07266998291015625, 0.08017539978027344, 0.08768081665039062, 0.09518623352050781, 0.102691650390625, 0.11019706726074219, 0.11770248413085938, 0.12520790100097656, 0.13271331787109375, 0.14021873474121094, 0.14772415161132812, 0.1552295684814453, 0.1627349853515625, 0.1702404022216797, 0.17774581909179688, 0.18525123596191406, 0.19275665283203125, 0.20026206970214844, 0.20776748657226562, 0.2152729034423828, 0.2227783203125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 7.0, 10.0, 12.0, 24.0, 19.0, 18.0, 32.0, 27.0, 34.0, 45.0, 45.0, 52.0, 55.0, 47.0, 67.0, 53.0, 59.0, 45.0, 40.0, 51.0, 27.0, 30.0, 30.0, 19.0, 24.0, 22.0, 17.0, 14.0, 11.0, 13.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06207275390625, -0.05997943878173828, -0.05788612365722656, -0.055792808532714844, -0.053699493408203125, -0.051606178283691406, -0.04951286315917969, -0.04741954803466797, -0.04532623291015625, -0.04323291778564453, -0.04113960266113281, -0.039046287536621094, -0.036952972412109375, -0.034859657287597656, -0.03276634216308594, -0.03067302703857422, -0.0285797119140625, -0.02648639678955078, -0.024393081665039062, -0.022299766540527344, -0.020206451416015625, -0.018113136291503906, -0.016019821166992188, -0.013926506042480469, -0.01183319091796875, -0.009739875793457031, -0.0076465606689453125, -0.005553245544433594, -0.003459930419921875, -0.0013666152954101562, 0.0007266998291015625, 0.0028200149536132812, 0.004913330078125, 0.007006645202636719, 0.009099960327148438, 0.011193275451660156, 0.013286590576171875, 0.015379905700683594, 0.017473220825195312, 0.01956653594970703, 0.02165985107421875, 0.02375316619873047, 0.025846481323242188, 0.027939796447753906, 0.030033111572265625, 0.032126426696777344, 0.03421974182128906, 0.03631305694580078, 0.0384063720703125, 0.04049968719482422, 0.04259300231933594, 0.044686317443847656, 0.046779632568359375, 0.048872947692871094, 0.05096626281738281, 0.05305957794189453, 0.05515289306640625, 0.05724620819091797, 0.05933952331542969, 0.061432838439941406, 0.06352615356445312, 0.06561946868896484, 0.06771278381347656, 0.06980609893798828, 0.0718994140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 9.0, 11.0, 10.0, 15.0, 15.0, 18.0, 29.0, 41.0, 64.0, 69.0, 116.0, 147.0, 239.0, 428.0, 877.0, 2224.0, 6607.0, 24475.0, 119413.0, 672321.0, 176058.0, 31846.0, 8476.0, 2646.0, 1048.0, 519.0, 261.0, 172.0, 90.0, 80.0, 41.0, 43.0, 36.0, 25.0, 17.0, 10.0, 10.0, 14.0, 2.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.491455078125, -0.4748497009277344, -0.45824432373046875, -0.4416389465332031, -0.4250335693359375, -0.4084281921386719, -0.39182281494140625, -0.3752174377441406, -0.358612060546875, -0.3420066833496094, -0.32540130615234375, -0.3087959289550781, -0.2921905517578125, -0.2755851745605469, -0.25897979736328125, -0.24237442016601562, -0.22576904296875, -0.20916366577148438, -0.19255828857421875, -0.17595291137695312, -0.1593475341796875, -0.14274215698242188, -0.12613677978515625, -0.10953140258789062, -0.092926025390625, -0.07632064819335938, -0.05971527099609375, -0.043109893798828125, -0.0265045166015625, -0.009899139404296875, 0.00670623779296875, 0.023311614990234375, 0.0399169921875, 0.056522369384765625, 0.07312774658203125, 0.08973312377929688, 0.1063385009765625, 0.12294387817382812, 0.13954925537109375, 0.15615463256835938, 0.172760009765625, 0.18936538696289062, 0.20597076416015625, 0.22257614135742188, 0.2391815185546875, 0.2557868957519531, 0.27239227294921875, 0.2889976501464844, 0.30560302734375, 0.3222084045410156, 0.33881378173828125, 0.3554191589355469, 0.3720245361328125, 0.3886299133300781, 0.40523529052734375, 0.4218406677246094, 0.438446044921875, 0.4550514221191406, 0.47165679931640625, 0.4882621765136719, 0.5048675537109375, 0.5214729309082031, 0.5380783081054688, 0.5546836853027344, 0.5712890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 11.0, 4.0, 15.0, 14.0, 15.0, 18.0, 20.0, 19.0, 18.0, 31.0, 23.0, 27.0, 28.0, 43.0, 43.0, 36.0, 55.0, 41.0, 37.0, 58.0, 45.0, 51.0, 38.0, 46.0, 38.0, 29.0, 24.0, 29.0, 17.0, 24.0, 13.0, 15.0, 12.0, 11.0, 8.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.15110206604003906, -0.14632034301757812, -0.1415386199951172, -0.13675689697265625, -0.1319751739501953, -0.12719345092773438, -0.12241172790527344, -0.1176300048828125, -0.11284828186035156, -0.10806655883789062, -0.10328483581542969, -0.09850311279296875, -0.09372138977050781, -0.08893966674804688, -0.08415794372558594, -0.079376220703125, -0.07459449768066406, -0.06981277465820312, -0.06503105163574219, -0.06024932861328125, -0.05546760559082031, -0.050685882568359375, -0.04590415954589844, -0.0411224365234375, -0.03634071350097656, -0.031558990478515625, -0.026777267456054688, -0.02199554443359375, -0.017213821411132812, -0.012432098388671875, -0.0076503753662109375, -0.00286865234375, 0.0019130706787109375, 0.006694793701171875, 0.011476516723632812, 0.01625823974609375, 0.021039962768554688, 0.025821685791015625, 0.030603408813476562, 0.0353851318359375, 0.04016685485839844, 0.044948577880859375, 0.04973030090332031, 0.05451202392578125, 0.05929374694824219, 0.06407546997070312, 0.06885719299316406, 0.073638916015625, 0.07842063903808594, 0.08320236206054688, 0.08798408508300781, 0.09276580810546875, 0.09754753112792969, 0.10232925415039062, 0.10711097717285156, 0.1118927001953125, 0.11667442321777344, 0.12145614624023438, 0.1262378692626953, 0.13101959228515625, 0.1358013153076172, 0.14058303833007812, 0.14536476135253906, 0.150146484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 5.0, 12.0, 17.0, 20.0, 33.0, 43.0, 70.0, 142.0, 260.0, 606.0, 2062.0, 7773.0, 47986.0, 791225.0, 175400.0, 17276.0, 3692.0, 1091.0, 383.0, 182.0, 90.0, 63.0, 31.0, 28.0, 12.0, 12.0, 6.0, 7.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2486572265625, -0.23935890197753906, -0.23006057739257812, -0.2207622528076172, -0.21146392822265625, -0.2021656036376953, -0.19286727905273438, -0.18356895446777344, -0.1742706298828125, -0.16497230529785156, -0.15567398071289062, -0.1463756561279297, -0.13707733154296875, -0.1277790069580078, -0.11848068237304688, -0.10918235778808594, -0.099884033203125, -0.09058570861816406, -0.08128738403320312, -0.07198905944824219, -0.06269073486328125, -0.05339241027832031, -0.044094085693359375, -0.03479576110839844, -0.0254974365234375, -0.016199111938476562, -0.006900787353515625, 0.0023975372314453125, 0.01169586181640625, 0.020994186401367188, 0.030292510986328125, 0.03959083557128906, 0.04888916015625, 0.05818748474121094, 0.06748580932617188, 0.07678413391113281, 0.08608245849609375, 0.09538078308105469, 0.10467910766601562, 0.11397743225097656, 0.1232757568359375, 0.13257408142089844, 0.14187240600585938, 0.1511707305908203, 0.16046905517578125, 0.1697673797607422, 0.17906570434570312, 0.18836402893066406, 0.197662353515625, 0.20696067810058594, 0.21625900268554688, 0.2255573272705078, 0.23485565185546875, 0.2441539764404297, 0.2534523010253906, 0.26275062561035156, 0.2720489501953125, 0.28134727478027344, 0.2906455993652344, 0.2999439239501953, 0.30924224853515625, 0.3185405731201172, 0.3278388977050781, 0.33713722229003906, 0.346435546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 14.0, 12.0, 16.0, 13.0, 29.0, 30.0, 44.0, 61.0, 78.0, 137.0, 159.0, 123.0, 75.0, 48.0, 37.0, 26.0, 22.0, 10.0, 14.0, 11.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74913215637207e-05, -3.62154096364975e-05, -3.493949770927429e-05, -3.3663585782051086e-05, -3.238767385482788e-05, -3.1111761927604675e-05, -2.983585000038147e-05, -2.8559938073158264e-05, -2.728402614593506e-05, -2.6008114218711853e-05, -2.4732202291488647e-05, -2.3456290364265442e-05, -2.2180378437042236e-05, -2.090446650981903e-05, -1.9628554582595825e-05, -1.835264265537262e-05, -1.7076730728149414e-05, -1.580081880092621e-05, -1.4524906873703003e-05, -1.3248994946479797e-05, -1.1973083019256592e-05, -1.0697171092033386e-05, -9.42125916481018e-06, -8.145347237586975e-06, -6.8694353103637695e-06, -5.593523383140564e-06, -4.317611455917358e-06, -3.041699528694153e-06, -1.7657876014709473e-06, -4.898756742477417e-07, 7.860362529754639e-07, 2.0619481801986694e-06, 3.337860107421875e-06, 4.6137720346450806e-06, 5.889683961868286e-06, 7.165595889091492e-06, 8.441507816314697e-06, 9.717419743537903e-06, 1.0993331670761108e-05, 1.2269243597984314e-05, 1.354515552520752e-05, 1.4821067452430725e-05, 1.609697937965393e-05, 1.7372891306877136e-05, 1.8648803234100342e-05, 1.9924715161323547e-05, 2.1200627088546753e-05, 2.247653901576996e-05, 2.3752450942993164e-05, 2.502836287021637e-05, 2.6304274797439575e-05, 2.758018672466278e-05, 2.8856098651885986e-05, 3.0132010579109192e-05, 3.14079225063324e-05, 3.26838344335556e-05, 3.395974636077881e-05, 3.5235658288002014e-05, 3.651157021522522e-05, 3.7787482142448425e-05, 3.906339406967163e-05, 4.0339305996894836e-05, 4.161521792411804e-05, 4.289112985134125e-05, 4.416704177856445e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 11.0, 11.0, 23.0, 47.0, 67.0, 126.0, 230.0, 467.0, 1169.0, 3235.0, 13758.0, 121509.0, 846605.0, 49586.0, 7859.0, 2172.0, 848.0, 372.0, 179.0, 101.0, 64.0, 30.0, 26.0, 12.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1939697265625, -0.18712234497070312, -0.18027496337890625, -0.17342758178710938, -0.1665802001953125, -0.15973281860351562, -0.15288543701171875, -0.14603805541992188, -0.139190673828125, -0.13234329223632812, -0.12549591064453125, -0.11864852905273438, -0.1118011474609375, -0.10495376586914062, -0.09810638427734375, -0.09125900268554688, -0.08441162109375, -0.07756423950195312, -0.07071685791015625, -0.06386947631835938, -0.0570220947265625, -0.050174713134765625, -0.04332733154296875, -0.036479949951171875, -0.029632568359375, -0.022785186767578125, -0.01593780517578125, -0.009090423583984375, -0.0022430419921875, 0.004604339599609375, 0.01145172119140625, 0.018299102783203125, 0.025146484375, 0.031993865966796875, 0.03884124755859375, 0.045688629150390625, 0.0525360107421875, 0.059383392333984375, 0.06623077392578125, 0.07307815551757812, 0.079925537109375, 0.08677291870117188, 0.09362030029296875, 0.10046768188476562, 0.1073150634765625, 0.11416244506835938, 0.12100982666015625, 0.12785720825195312, 0.13470458984375, 0.14155197143554688, 0.14839935302734375, 0.15524673461914062, 0.1620941162109375, 0.16894149780273438, 0.17578887939453125, 0.18263626098632812, 0.189483642578125, 0.19633102416992188, 0.20317840576171875, 0.21002578735351562, 0.2168731689453125, 0.22372055053710938, 0.23056793212890625, 0.23741531372070312, 0.2442626953125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 12.0, 14.0, 22.0, 33.0, 53.0, 57.0, 109.0, 170.0, 191.0, 106.0, 70.0, 44.0, 27.0, 19.0, 25.0, 9.0, 7.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.0817117691040039, -0.07907295227050781, -0.07643413543701172, -0.07379531860351562, -0.07115650177001953, -0.06851768493652344, -0.06587886810302734, -0.06324005126953125, -0.060601234436035156, -0.05796241760253906, -0.05532360076904297, -0.052684783935546875, -0.05004596710205078, -0.04740715026855469, -0.044768333435058594, -0.0421295166015625, -0.039490699768066406, -0.03685188293457031, -0.03421306610107422, -0.031574249267578125, -0.02893543243408203, -0.026296615600585938, -0.023657798767089844, -0.02101898193359375, -0.018380165100097656, -0.015741348266601562, -0.013102531433105469, -0.010463714599609375, -0.007824897766113281, -0.0051860809326171875, -0.0025472640991210938, 9.1552734375e-05, 0.0027303695678710938, 0.0053691864013671875, 0.008008003234863281, 0.010646820068359375, 0.013285636901855469, 0.015924453735351562, 0.018563270568847656, 0.02120208740234375, 0.023840904235839844, 0.026479721069335938, 0.02911853790283203, 0.031757354736328125, 0.03439617156982422, 0.03703498840332031, 0.039673805236816406, 0.0423126220703125, 0.044951438903808594, 0.04759025573730469, 0.05022907257080078, 0.052867889404296875, 0.05550670623779297, 0.05814552307128906, 0.060784339904785156, 0.06342315673828125, 0.06606197357177734, 0.06870079040527344, 0.07133960723876953, 0.07397842407226562, 0.07661724090576172, 0.07925605773925781, 0.0818948745727539, 0.08453369140625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 40.0, 311.0, 530.0, 105.0, 21.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6719133853912354, -0.5430411100387573, -0.4141687750816345, -0.2852964699268341, -0.1564241647720337, -0.027551889419555664, 0.10132044553756714, 0.23019278049468994, 0.35906505584716797, 0.4879373610019684, 0.6168096661567688, 0.7456820011138916, 0.8745542764663696, 1.0034265518188477, 1.1322989463806152, 1.2611712217330933, 1.3900434970855713, 1.5189157724380493, 1.6477880477905273, 1.776660442352295, 1.905532717704773, 2.034404993057251, 2.1632773876190186, 2.292149543762207, 2.4210219383239746, 2.549894332885742, 2.6787664890289307, 2.8076388835906982, 2.9365110397338867, 3.0653834342956543, 3.194255828857422, 3.3231282234191895, 3.452000617980957, 3.5808730125427246, 3.709745168685913, 3.8386175632476807, 3.967489719390869, 4.096362113952637, 4.225234508514404, 4.354106903076172, 4.482978820800781, 4.611851215362549, 4.740723609924316, 4.869595527648926, 4.998467922210693, 5.127340316772461, 5.2562127113342285, 5.385085105895996, 5.513957500457764, 5.642829895019531, 5.771702289581299, 5.900574207305908, 6.029446601867676, 6.158318996429443, 6.287191390991211, 6.4160637855529785, 6.544936180114746, 6.673808574676514, 6.802680969238281, 6.931552886962891, 7.060425281524658, 7.189297676086426, 7.318170070648193, 7.447042465209961, 7.57591438293457]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 1.0, 5.0, 8.0, 13.0, 13.0, 11.0, 22.0, 19.0, 21.0, 22.0, 31.0, 39.0, 30.0, 45.0, 32.0, 42.0, 34.0, 41.0, 46.0, 39.0, 52.0, 33.0, 49.0, 50.0, 39.0, 39.0, 32.0, 24.0, 28.0, 20.0, 21.0, 16.0, 16.0, 11.0, 13.0, 10.0, 8.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5708951950073242, -0.5520833730697632, -0.5332715511322021, -0.5144597291946411, -0.4956478774547577, -0.47683605551719666, -0.45802420377731323, -0.4392123818397522, -0.42040055990219116, -0.4015887379646301, -0.3827769160270691, -0.36396506428718567, -0.34515324234962463, -0.3263414204120636, -0.3075295686721802, -0.28871774673461914, -0.2699059247970581, -0.25109410285949707, -0.23228226602077484, -0.2134704291820526, -0.19465860724449158, -0.17584678530693054, -0.1570349484682083, -0.13822311162948608, -0.11941128969192505, -0.10059946030378342, -0.08178763091564178, -0.06297580152750015, -0.04416397213935852, -0.02535214275121689, -0.006540313363075256, 0.012271523475646973, 0.031083285808563232, 0.049895115196704865, 0.0687069445848465, 0.08751877397298813, 0.10633060336112976, 0.1251424252986908, 0.14395426213741302, 0.16276609897613525, 0.1815779209136963, 0.20038974285125732, 0.21920157968997955, 0.23801341652870178, 0.2568252384662628, 0.27563706040382385, 0.2944489121437073, 0.3132607340812683, 0.33207255601882935, 0.3508843779563904, 0.3696961998939514, 0.38850805163383484, 0.4073198735713959, 0.4261316955089569, 0.44494354724884033, 0.46375536918640137, 0.4825671911239624, 0.5013790130615234, 0.5201908349990845, 0.5390026569366455, 0.5578144788742065, 0.5766263604164124, 0.5954381823539734, 0.6142500042915344, 0.6330618262290955]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 7.0, 3.0, 6.0, 13.0, 10.0, 7.0, 18.0, 22.0, 26.0, 37.0, 39.0, 52.0, 72.0, 101.0, 148.0, 184.0, 303.0, 474.0, 893.0, 2257.0, 8322.0, 64143.0, 4003748.0, 98310.0, 10126.0, 2509.0, 904.0, 481.0, 332.0, 222.0, 133.0, 92.0, 60.0, 53.0, 48.0, 25.0, 28.0, 20.0, 13.0, 10.0, 7.0, 9.0, 5.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.720703125, -0.6978759765625, -0.675048828125, -0.6522216796875, -0.62939453125, -0.6065673828125, -0.583740234375, -0.5609130859375, -0.5380859375, -0.5152587890625, -0.492431640625, -0.4696044921875, -0.44677734375, -0.4239501953125, -0.401123046875, -0.3782958984375, -0.35546875, -0.3326416015625, -0.309814453125, -0.2869873046875, -0.26416015625, -0.2413330078125, -0.218505859375, -0.1956787109375, -0.1728515625, -0.1500244140625, -0.127197265625, -0.1043701171875, -0.08154296875, -0.0587158203125, -0.035888671875, -0.0130615234375, 0.009765625, 0.0325927734375, 0.055419921875, 0.0782470703125, 0.10107421875, 0.1239013671875, 0.146728515625, 0.1695556640625, 0.1923828125, 0.2152099609375, 0.238037109375, 0.2608642578125, 0.28369140625, 0.3065185546875, 0.329345703125, 0.3521728515625, 0.375, 0.3978271484375, 0.420654296875, 0.4434814453125, 0.46630859375, 0.4891357421875, 0.511962890625, 0.5347900390625, 0.5576171875, 0.5804443359375, 0.603271484375, 0.6260986328125, 0.64892578125, 0.6717529296875, 0.694580078125, 0.7174072265625, 0.740234375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 7.0, 4.0, 10.0, 3.0, 6.0, 8.0, 12.0, 9.0, 13.0, 19.0, 26.0, 17.0, 28.0, 34.0, 30.0, 46.0, 39.0, 54.0, 55.0, 55.0, 53.0, 46.0, 51.0, 45.0, 37.0, 45.0, 37.0, 36.0, 30.0, 28.0, 27.0, 14.0, 16.0, 13.0, 8.0, 7.0, 10.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.072265625, -0.0701742172241211, -0.06808280944824219, -0.06599140167236328, -0.06389999389648438, -0.06180858612060547, -0.05971717834472656, -0.057625770568847656, -0.05553436279296875, -0.053442955017089844, -0.05135154724121094, -0.04926013946533203, -0.047168731689453125, -0.04507732391357422, -0.04298591613769531, -0.040894508361816406, -0.0388031005859375, -0.036711692810058594, -0.03462028503417969, -0.03252887725830078, -0.030437469482421875, -0.02834606170654297, -0.026254653930664062, -0.024163246154785156, -0.02207183837890625, -0.019980430603027344, -0.017889022827148438, -0.01579761505126953, -0.013706207275390625, -0.011614799499511719, -0.009523391723632812, -0.007431983947753906, -0.005340576171875, -0.0032491683959960938, -0.0011577606201171875, 0.0009336471557617188, 0.003025054931640625, 0.005116462707519531, 0.0072078704833984375, 0.009299278259277344, 0.01139068603515625, 0.013482093811035156, 0.015573501586914062, 0.01766490936279297, 0.019756317138671875, 0.02184772491455078, 0.023939132690429688, 0.026030540466308594, 0.0281219482421875, 0.030213356018066406, 0.03230476379394531, 0.03439617156982422, 0.036487579345703125, 0.03857898712158203, 0.04067039489746094, 0.042761802673339844, 0.04485321044921875, 0.046944618225097656, 0.04903602600097656, 0.05112743377685547, 0.053218841552734375, 0.05531024932861328, 0.05740165710449219, 0.059493064880371094, 0.06158447265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 14.0, 27.0, 32.0, 38.0, 62.0, 122.0, 270.0, 693.0, 2043.0, 7831.0, 40599.0, 547311.0, 3490343.0, 86114.0, 13709.0, 3320.0, 955.0, 367.0, 160.0, 83.0, 46.0, 37.0, 20.0, 12.0, 9.0, 10.0, 7.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58349609375, -0.5673713684082031, -0.5512466430664062, -0.5351219177246094, -0.5189971923828125, -0.5028724670410156, -0.48674774169921875, -0.4706230163574219, -0.454498291015625, -0.4383735656738281, -0.42224884033203125, -0.4061241149902344, -0.3899993896484375, -0.3738746643066406, -0.35774993896484375, -0.3416252136230469, -0.32550048828125, -0.3093757629394531, -0.29325103759765625, -0.2771263122558594, -0.2610015869140625, -0.24487686157226562, -0.22875213623046875, -0.21262741088867188, -0.196502685546875, -0.18037796020507812, -0.16425323486328125, -0.14812850952148438, -0.1320037841796875, -0.11587905883789062, -0.09975433349609375, -0.08362960815429688, -0.0675048828125, -0.051380157470703125, -0.03525543212890625, -0.019130706787109375, -0.0030059814453125, 0.013118743896484375, 0.02924346923828125, 0.045368194580078125, 0.061492919921875, 0.07761764526367188, 0.09374237060546875, 0.10986709594726562, 0.1259918212890625, 0.14211654663085938, 0.15824127197265625, 0.17436599731445312, 0.19049072265625, 0.20661544799804688, 0.22274017333984375, 0.23886489868164062, 0.2549896240234375, 0.2711143493652344, 0.28723907470703125, 0.3033638000488281, 0.319488525390625, 0.3356132507324219, 0.35173797607421875, 0.3678627014160156, 0.3839874267578125, 0.4001121520996094, 0.41623687744140625, 0.4323616027832031, 0.448486328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 6.0, 6.0, 11.0, 10.0, 10.0, 24.0, 17.0, 27.0, 28.0, 41.0, 55.0, 82.0, 117.0, 173.0, 423.0, 1269.0, 873.0, 316.0, 142.0, 124.0, 68.0, 42.0, 37.0, 27.0, 33.0, 27.0, 16.0, 18.0, 10.0, 9.0, 6.0, 6.0, 5.0, 6.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1444091796875, -0.13956642150878906, -0.13472366333007812, -0.1298809051513672, -0.12503814697265625, -0.12019538879394531, -0.11535263061523438, -0.11050987243652344, -0.1056671142578125, -0.10082435607910156, -0.09598159790039062, -0.09113883972167969, -0.08629608154296875, -0.08145332336425781, -0.07661056518554688, -0.07176780700683594, -0.066925048828125, -0.06208229064941406, -0.057239532470703125, -0.05239677429199219, -0.04755401611328125, -0.04271125793457031, -0.037868499755859375, -0.03302574157714844, -0.0281829833984375, -0.023340225219726562, -0.018497467041015625, -0.013654708862304688, -0.00881195068359375, -0.0039691925048828125, 0.000873565673828125, 0.0057163238525390625, 0.01055908203125, 0.015401840209960938, 0.020244598388671875, 0.025087356567382812, 0.02993011474609375, 0.03477287292480469, 0.039615631103515625, 0.04445838928222656, 0.0493011474609375, 0.05414390563964844, 0.058986663818359375, 0.06382942199707031, 0.06867218017578125, 0.07351493835449219, 0.07835769653320312, 0.08320045471191406, 0.088043212890625, 0.09288597106933594, 0.09772872924804688, 0.10257148742675781, 0.10741424560546875, 0.11225700378417969, 0.11709976196289062, 0.12194252014160156, 0.1267852783203125, 0.13162803649902344, 0.13647079467773438, 0.1413135528564453, 0.14615631103515625, 0.1509990692138672, 0.15584182739257812, 0.16068458557128906, 0.16552734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 10.0, 14.0, 25.0, 48.0, 57.0, 123.0, 180.0, 192.0, 120.0, 86.0, 51.0, 34.0, 25.0, 9.0, 11.0, 5.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34069955348968506, -0.31957659125328064, -0.2984536290168762, -0.2773306369781494, -0.256207674741745, -0.23508471250534058, -0.21396175026893616, -0.19283877313137054, -0.17171581089496613, -0.1505928486585617, -0.1294698715209961, -0.10834690928459167, -0.08722393959760666, -0.06610096991062164, -0.044978007674217224, -0.02385503053665161, -0.0027320683002471924, 0.018390899524092674, 0.03951386734843254, 0.06063683331012726, 0.08175980299711227, 0.10288277268409729, 0.12400573492050171, 0.14512871205806732, 0.16625167429447174, 0.18737463653087616, 0.20849761366844177, 0.2296205759048462, 0.2507435381412506, 0.27186650037765503, 0.29298949241638184, 0.31411245465278625, 0.3352354168891907, 0.3563583791255951, 0.3774813413619995, 0.3986043334007263, 0.41972729563713074, 0.44085025787353516, 0.4619732201099396, 0.483096182346344, 0.5042191743850708, 0.5253421664237976, 0.5464650988578796, 0.5675880908966064, 0.5887110233306885, 0.6098340153694153, 0.6309570074081421, 0.6520799398422241, 0.6732028722763062, 0.694325864315033, 0.715448796749115, 0.7365717887878418, 0.7576947212219238, 0.7788177132606506, 0.7999407052993774, 0.8210636377334595, 0.8421866297721863, 0.8633096218109131, 0.8844325542449951, 0.9055555462837219, 0.926678478717804, 0.9478014707565308, 0.9689244031906128, 0.9900473952293396, 1.0111703872680664]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 14.0, 10.0, 14.0, 20.0, 24.0, 19.0, 30.0, 36.0, 29.0, 36.0, 52.0, 43.0, 54.0, 49.0, 47.0, 48.0, 60.0, 46.0, 41.0, 44.0, 39.0, 31.0, 31.0, 28.0, 24.0, 17.0, 17.0, 21.0, 16.0, 9.0, 9.0, 7.0, 10.0, 4.0, 0.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37087929248809814, -0.3571820557117462, -0.3434848487377167, -0.32978761196136475, -0.3160904049873352, -0.3023931682109833, -0.28869593143463135, -0.2749987244606018, -0.2613014876842499, -0.24760426580905914, -0.2339070439338684, -0.22020980715751648, -0.20651258528232574, -0.192815363407135, -0.17911812663078308, -0.16542090475559235, -0.1517236828804016, -0.13802646100521088, -0.12432923167943954, -0.11063200235366821, -0.09693478047847748, -0.08323755860328674, -0.06954032927751541, -0.05584309995174408, -0.042145878076553345, -0.02844865247607231, -0.014751426875591278, -0.0010542012751102448, 0.012643024325370789, 0.026340246200561523, 0.040037475526332855, 0.05373470485210419, 0.06743192672729492, 0.08112914860248566, 0.09482637792825699, 0.10852360725402832, 0.12222082912921906, 0.1359180510044098, 0.14961528778076172, 0.16331250965595245, 0.1770097315311432, 0.19070695340633392, 0.20440417528152466, 0.2181014120578766, 0.23179863393306732, 0.24549585580825806, 0.25919309258461, 0.2728903293609619, 0.28658753633499146, 0.3002847731113434, 0.3139819800853729, 0.32767921686172485, 0.3413764238357544, 0.3550736606121063, 0.36877089738845825, 0.3824681043624878, 0.3961653411388397, 0.40986257791519165, 0.4235597848892212, 0.4372570216655731, 0.45095425844192505, 0.4646514654159546, 0.4783487021923065, 0.49204593896865845, 0.505743145942688]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 8.0, 9.0, 6.0, 13.0, 18.0, 28.0, 51.0, 52.0, 81.0, 107.0, 174.0, 233.0, 336.0, 511.0, 745.0, 1041.0, 1687.0, 2511.0, 3922.0, 6111.0, 9665.0, 16550.0, 29108.0, 53893.0, 109851.0, 223865.0, 274704.0, 149939.0, 71874.0, 37614.0, 20610.0, 12050.0, 7510.0, 4595.0, 3014.0, 1976.0, 1299.0, 907.0, 531.0, 405.0, 273.0, 225.0, 132.0, 87.0, 70.0, 54.0, 37.0, 25.0, 15.0, 10.0, 8.0, 7.0, 3.0, 4.0, 0.0, 3.0, 0.0, 4.0], "bins": [-0.1585693359375, -0.15364646911621094, -0.14872360229492188, -0.1438007354736328, -0.13887786865234375, -0.1339550018310547, -0.12903213500976562, -0.12410926818847656, -0.1191864013671875, -0.11426353454589844, -0.10934066772460938, -0.10441780090332031, -0.09949493408203125, -0.09457206726074219, -0.08964920043945312, -0.08472633361816406, -0.079803466796875, -0.07488059997558594, -0.06995773315429688, -0.06503486633300781, -0.06011199951171875, -0.05518913269042969, -0.050266265869140625, -0.04534339904785156, -0.0404205322265625, -0.03549766540527344, -0.030574798583984375, -0.025651931762695312, -0.02072906494140625, -0.015806198120117188, -0.010883331298828125, -0.0059604644775390625, -0.00103759765625, 0.0038852691650390625, 0.008808135986328125, 0.013731002807617188, 0.01865386962890625, 0.023576736450195312, 0.028499603271484375, 0.03342247009277344, 0.0383453369140625, 0.04326820373535156, 0.048191070556640625, 0.05311393737792969, 0.05803680419921875, 0.06295967102050781, 0.06788253784179688, 0.07280540466308594, 0.077728271484375, 0.08265113830566406, 0.08757400512695312, 0.09249687194824219, 0.09741973876953125, 0.10234260559082031, 0.10726547241210938, 0.11218833923339844, 0.1171112060546875, 0.12203407287597656, 0.12695693969726562, 0.1318798065185547, 0.13680267333984375, 0.1417255401611328, 0.14664840698242188, 0.15157127380371094, 0.156494140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 6.0, 5.0, 3.0, 9.0, 9.0, 9.0, 8.0, 10.0, 17.0, 22.0, 22.0, 25.0, 25.0, 28.0, 26.0, 38.0, 48.0, 43.0, 37.0, 48.0, 45.0, 43.0, 45.0, 52.0, 37.0, 46.0, 29.0, 29.0, 36.0, 26.0, 28.0, 22.0, 16.0, 23.0, 15.0, 13.0, 7.0, 10.0, 9.0, 7.0, 5.0, 3.0, 0.0, 2.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.057403564453125, -0.05576038360595703, -0.05411720275878906, -0.052474021911621094, -0.050830841064453125, -0.049187660217285156, -0.04754447937011719, -0.04590129852294922, -0.04425811767578125, -0.04261493682861328, -0.04097175598144531, -0.039328575134277344, -0.037685394287109375, -0.036042213439941406, -0.03439903259277344, -0.03275585174560547, -0.0311126708984375, -0.02946949005126953, -0.027826309204101562, -0.026183128356933594, -0.024539947509765625, -0.022896766662597656, -0.021253585815429688, -0.01961040496826172, -0.01796722412109375, -0.01632404327392578, -0.014680862426757812, -0.013037681579589844, -0.011394500732421875, -0.009751319885253906, -0.008108139038085938, -0.006464958190917969, -0.00482177734375, -0.0031785964965820312, -0.0015354156494140625, 0.00010776519775390625, 0.001750946044921875, 0.0033941268920898438, 0.0050373077392578125, 0.006680488586425781, 0.00832366943359375, 0.009966850280761719, 0.011610031127929688, 0.013253211975097656, 0.014896392822265625, 0.016539573669433594, 0.018182754516601562, 0.01982593536376953, 0.0214691162109375, 0.02311229705810547, 0.024755477905273438, 0.026398658752441406, 0.028041839599609375, 0.029685020446777344, 0.03132820129394531, 0.03297138214111328, 0.03461456298828125, 0.03625774383544922, 0.03790092468261719, 0.039544105529785156, 0.041187286376953125, 0.042830467224121094, 0.04447364807128906, 0.04611682891845703, 0.047760009765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 12.0, 12.0, 12.0, 9.0, 22.0, 29.0, 62.0, 73.0, 92.0, 138.0, 238.0, 386.0, 691.0, 1280.0, 2344.0, 4407.0, 8535.0, 17668.0, 38966.0, 95918.0, 256465.0, 354914.0, 156132.0, 59175.0, 25710.0, 12156.0, 6014.0, 3113.0, 1683.0, 925.0, 534.0, 269.0, 163.0, 103.0, 81.0, 55.0, 44.0, 30.0, 24.0, 14.0, 14.0, 8.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.19091796875, -0.18517494201660156, -0.17943191528320312, -0.1736888885498047, -0.16794586181640625, -0.1622028350830078, -0.15645980834960938, -0.15071678161621094, -0.1449737548828125, -0.13923072814941406, -0.13348770141601562, -0.1277446746826172, -0.12200164794921875, -0.11625862121582031, -0.11051559448242188, -0.10477256774902344, -0.099029541015625, -0.09328651428222656, -0.08754348754882812, -0.08180046081542969, -0.07605743408203125, -0.07031440734863281, -0.06457138061523438, -0.05882835388183594, -0.0530853271484375, -0.04734230041503906, -0.041599273681640625, -0.03585624694824219, -0.03011322021484375, -0.024370193481445312, -0.018627166748046875, -0.012884140014648438, -0.00714111328125, -0.0013980865478515625, 0.004344940185546875, 0.010087966918945312, 0.01583099365234375, 0.021574020385742188, 0.027317047119140625, 0.03306007385253906, 0.0388031005859375, 0.04454612731933594, 0.050289154052734375, 0.05603218078613281, 0.06177520751953125, 0.06751823425292969, 0.07326126098632812, 0.07900428771972656, 0.084747314453125, 0.09049034118652344, 0.09623336791992188, 0.10197639465332031, 0.10771942138671875, 0.11346244812011719, 0.11920547485351562, 0.12494850158691406, 0.1306915283203125, 0.13643455505371094, 0.14217758178710938, 0.1479206085205078, 0.15366363525390625, 0.1594066619873047, 0.16514968872070312, 0.17089271545410156, 0.1766357421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 9.0, 13.0, 9.0, 13.0, 14.0, 18.0, 23.0, 21.0, 24.0, 32.0, 32.0, 36.0, 40.0, 41.0, 42.0, 38.0, 53.0, 42.0, 43.0, 45.0, 42.0, 36.0, 37.0, 32.0, 31.0, 35.0, 37.0, 23.0, 17.0, 20.0, 14.0, 14.0, 11.0, 11.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.11175251007080078, -0.10784339904785156, -0.10393428802490234, -0.10002517700195312, -0.0961160659790039, -0.09220695495605469, -0.08829784393310547, -0.08438873291015625, -0.08047962188720703, -0.07657051086425781, -0.0726613998413086, -0.06875228881835938, -0.06484317779541016, -0.06093406677246094, -0.05702495574951172, -0.0531158447265625, -0.04920673370361328, -0.04529762268066406, -0.041388511657714844, -0.037479400634765625, -0.033570289611816406, -0.029661178588867188, -0.02575206756591797, -0.02184295654296875, -0.01793384552001953, -0.014024734497070312, -0.010115623474121094, -0.006206512451171875, -0.0022974014282226562, 0.0016117095947265625, 0.005520820617675781, 0.009429931640625, 0.013339042663574219, 0.017248153686523438, 0.021157264709472656, 0.025066375732421875, 0.028975486755371094, 0.03288459777832031, 0.03679370880126953, 0.04070281982421875, 0.04461193084716797, 0.04852104187011719, 0.052430152893066406, 0.056339263916015625, 0.060248374938964844, 0.06415748596191406, 0.06806659698486328, 0.0719757080078125, 0.07588481903076172, 0.07979393005371094, 0.08370304107666016, 0.08761215209960938, 0.0915212631225586, 0.09543037414550781, 0.09933948516845703, 0.10324859619140625, 0.10715770721435547, 0.11106681823730469, 0.1149759292602539, 0.11888504028320312, 0.12279415130615234, 0.12670326232910156, 0.13061237335205078, 0.134521484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 10.0, 20.0, 23.0, 26.0, 36.0, 39.0, 63.0, 91.0, 120.0, 180.0, 265.0, 364.0, 647.0, 978.0, 1861.0, 4226.0, 11860.0, 52827.0, 640048.0, 289439.0, 30022.0, 8280.0, 3151.0, 1471.0, 821.0, 553.0, 336.0, 270.0, 148.0, 88.0, 87.0, 58.0, 34.0, 25.0, 27.0, 16.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2261962890625, -0.21909141540527344, -0.21198654174804688, -0.2048816680908203, -0.19777679443359375, -0.1906719207763672, -0.18356704711914062, -0.17646217346191406, -0.1693572998046875, -0.16225242614746094, -0.15514755249023438, -0.1480426788330078, -0.14093780517578125, -0.1338329315185547, -0.12672805786132812, -0.11962318420410156, -0.112518310546875, -0.10541343688964844, -0.09830856323242188, -0.09120368957519531, -0.08409881591796875, -0.07699394226074219, -0.06988906860351562, -0.06278419494628906, -0.0556793212890625, -0.04857444763183594, -0.041469573974609375, -0.03436470031738281, -0.02725982666015625, -0.020154953002929688, -0.013050079345703125, -0.0059452056884765625, 0.00115966796875, 0.008264541625976562, 0.015369415283203125, 0.022474288940429688, 0.02957916259765625, 0.03668403625488281, 0.043788909912109375, 0.05089378356933594, 0.0579986572265625, 0.06510353088378906, 0.07220840454101562, 0.07931327819824219, 0.08641815185546875, 0.09352302551269531, 0.10062789916992188, 0.10773277282714844, 0.114837646484375, 0.12194252014160156, 0.12904739379882812, 0.1361522674560547, 0.14325714111328125, 0.1503620147705078, 0.15746688842773438, 0.16457176208496094, 0.1716766357421875, 0.17878150939941406, 0.18588638305664062, 0.1929912567138672, 0.20009613037109375, 0.2072010040283203, 0.21430587768554688, 0.22141075134277344, 0.228515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 7.0, 10.0, 12.0, 20.0, 30.0, 19.0, 57.0, 84.0, 148.0, 205.0, 141.0, 69.0, 46.0, 30.0, 20.0, 18.0, 21.0, 10.0, 9.0, 3.0, 6.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.950429916381836e-05, -2.8195790946483612e-05, -2.6887282729148865e-05, -2.5578774511814117e-05, -2.427026629447937e-05, -2.2961758077144623e-05, -2.1653249859809875e-05, -2.0344741642475128e-05, -1.903623342514038e-05, -1.7727725207805634e-05, -1.6419216990470886e-05, -1.5110708773136139e-05, -1.3802200555801392e-05, -1.2493692338466644e-05, -1.1185184121131897e-05, -9.87667590379715e-06, -8.568167686462402e-06, -7.259659469127655e-06, -5.951151251792908e-06, -4.64264303445816e-06, -3.334134817123413e-06, -2.0256265997886658e-06, -7.171183824539185e-07, 5.913898348808289e-07, 1.8998980522155762e-06, 3.2084062695503235e-06, 4.516914486885071e-06, 5.825422704219818e-06, 7.1339309215545654e-06, 8.442439138889313e-06, 9.75094735622406e-06, 1.1059455573558807e-05, 1.2367963790893555e-05, 1.3676472008228302e-05, 1.498498022556305e-05, 1.6293488442897797e-05, 1.7601996660232544e-05, 1.891050487756729e-05, 2.021901309490204e-05, 2.1527521312236786e-05, 2.2836029529571533e-05, 2.414453774690628e-05, 2.5453045964241028e-05, 2.6761554181575775e-05, 2.8070062398910522e-05, 2.937857061624527e-05, 3.068707883358002e-05, 3.1995587050914764e-05, 3.330409526824951e-05, 3.461260348558426e-05, 3.5921111702919006e-05, 3.7229619920253754e-05, 3.85381281375885e-05, 3.984663635492325e-05, 4.1155144572257996e-05, 4.246365278959274e-05, 4.377216100692749e-05, 4.508066922426224e-05, 4.6389177441596985e-05, 4.769768565893173e-05, 4.900619387626648e-05, 5.031470209360123e-05, 5.1623210310935974e-05, 5.293171852827072e-05, 5.424022674560547e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 0.0, 8.0, 10.0, 14.0, 25.0, 29.0, 57.0, 109.0, 157.0, 332.0, 645.0, 1291.0, 3121.0, 8555.0, 32525.0, 294712.0, 624217.0, 61870.0, 13089.0, 4299.0, 1757.0, 827.0, 369.0, 251.0, 111.0, 61.0, 45.0, 25.0, 14.0, 9.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148681640625, -0.14321136474609375, -0.1377410888671875, -0.13227081298828125, -0.126800537109375, -0.12133026123046875, -0.1158599853515625, -0.11038970947265625, -0.10491943359375, -0.09944915771484375, -0.0939788818359375, -0.08850860595703125, -0.083038330078125, -0.07756805419921875, -0.0720977783203125, -0.06662750244140625, -0.0611572265625, -0.05568695068359375, -0.0502166748046875, -0.04474639892578125, -0.039276123046875, -0.03380584716796875, -0.0283355712890625, -0.02286529541015625, -0.01739501953125, -0.01192474365234375, -0.0064544677734375, -0.00098419189453125, 0.004486083984375, 0.00995635986328125, 0.0154266357421875, 0.02089691162109375, 0.0263671875, 0.03183746337890625, 0.0373077392578125, 0.04277801513671875, 0.048248291015625, 0.05371856689453125, 0.0591888427734375, 0.06465911865234375, 0.07012939453125, 0.07559967041015625, 0.0810699462890625, 0.08654022216796875, 0.092010498046875, 0.09748077392578125, 0.1029510498046875, 0.10842132568359375, 0.1138916015625, 0.11936187744140625, 0.1248321533203125, 0.13030242919921875, 0.135772705078125, 0.14124298095703125, 0.1467132568359375, 0.15218353271484375, 0.15765380859375, 0.16312408447265625, 0.1685943603515625, 0.17406463623046875, 0.179534912109375, 0.18500518798828125, 0.1904754638671875, 0.19594573974609375, 0.201416015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 5.0, 4.0, 13.0, 13.0, 15.0, 21.0, 29.0, 49.0, 66.0, 77.0, 116.0, 130.0, 107.0, 93.0, 63.0, 46.0, 28.0, 27.0, 16.0, 16.0, 11.0, 12.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.08258056640625, -0.08025264739990234, -0.07792472839355469, -0.07559680938720703, -0.07326889038085938, -0.07094097137451172, -0.06861305236816406, -0.0662851333618164, -0.06395721435546875, -0.061629295349121094, -0.05930137634277344, -0.05697345733642578, -0.054645538330078125, -0.05231761932373047, -0.04998970031738281, -0.047661781311035156, -0.0453338623046875, -0.043005943298339844, -0.04067802429199219, -0.03835010528564453, -0.036022186279296875, -0.03369426727294922, -0.03136634826660156, -0.029038429260253906, -0.02671051025390625, -0.024382591247558594, -0.022054672241210938, -0.01972675323486328, -0.017398834228515625, -0.015070915222167969, -0.012742996215820312, -0.010415077209472656, -0.008087158203125, -0.005759239196777344, -0.0034313201904296875, -0.0011034011840820312, 0.001224517822265625, 0.0035524368286132812, 0.0058803558349609375, 0.008208274841308594, 0.01053619384765625, 0.012864112854003906, 0.015192031860351562, 0.01751995086669922, 0.019847869873046875, 0.02217578887939453, 0.024503707885742188, 0.026831626892089844, 0.0291595458984375, 0.031487464904785156, 0.03381538391113281, 0.03614330291748047, 0.038471221923828125, 0.04079914093017578, 0.04312705993652344, 0.045454978942871094, 0.04778289794921875, 0.050110816955566406, 0.05243873596191406, 0.05476665496826172, 0.057094573974609375, 0.05942249298095703, 0.06175041198730469, 0.06407833099365234, 0.06640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 9.0, 11.0, 32.0, 68.0, 147.0, 228.0, 225.0, 140.0, 67.0, 30.0, 28.0, 11.0, 5.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29053565859794617, -0.26106521487236023, -0.23159478604793549, -0.20212435722351074, -0.1726539134979248, -0.14318346977233887, -0.11371304094791412, -0.08424261212348938, -0.05477216839790344, -0.025301732122898102, 0.004168704152107239, 0.03363914042711258, 0.06310957670211792, 0.09258002042770386, 0.1220504492521286, 0.15152087807655334, 0.18099132180213928, 0.21046176552772522, 0.23993219435214996, 0.2694026231765747, 0.29887306690216064, 0.3283435106277466, 0.3578139543533325, 0.38728436827659607, 0.416754812002182, 0.44622525572776794, 0.4756956696510315, 0.5051661133766174, 0.5346365571022034, 0.5641070008277893, 0.5935774445533752, 0.6230478286743164, 0.6525182723999023, 0.6819887161254883, 0.7114591598510742, 0.7409296035766602, 0.7704000473022461, 0.799870491027832, 0.8293408751487732, 0.8588113188743591, 0.8882817625999451, 0.917752206325531, 0.9472226500511169, 0.9766930937767029, 1.006163477897644, 1.03563392162323, 1.065104365348816, 1.0945748090744019, 1.1240452527999878, 1.1535156965255737, 1.1829861402511597, 1.2124565839767456, 1.2419270277023315, 1.2713974714279175, 1.3008679151535034, 1.3303382396697998, 1.3598086833953857, 1.3892791271209717, 1.4187495708465576, 1.4482200145721436, 1.4776904582977295, 1.5071609020233154, 1.5366313457489014, 1.5661017894744873, 1.5955722332000732]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 2.0, 9.0, 16.0, 14.0, 6.0, 9.0, 13.0, 23.0, 26.0, 28.0, 31.0, 25.0, 37.0, 41.0, 38.0, 42.0, 50.0, 37.0, 43.0, 55.0, 45.0, 37.0, 36.0, 43.0, 30.0, 41.0, 26.0, 19.0, 36.0, 21.0, 24.0, 23.0, 14.0, 8.0, 11.0, 7.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38704580068588257, -0.37429752945899963, -0.3615492284297943, -0.3488009572029114, -0.33605265617370605, -0.3233043849468231, -0.3105560839176178, -0.29780781269073486, -0.28505951166152954, -0.2723112404346466, -0.2595629394054413, -0.24681465327739716, -0.23406636714935303, -0.2213180959224701, -0.20856979489326477, -0.19582152366638184, -0.1830732375383377, -0.17032495141029358, -0.15757666528224945, -0.14482837915420532, -0.1320800930261612, -0.11933181434869766, -0.10658352822065353, -0.0938352420926094, -0.08108695596456528, -0.06833866983652115, -0.05559038370847702, -0.04284210130572319, -0.030093815177679062, -0.017345532774925232, -0.0045972466468811035, 0.008151039481163025, 0.020899325609207153, 0.03364761173725128, 0.04639589786529541, 0.05914418026804924, 0.07189247012138367, 0.0846407487988472, 0.09738903492689133, 0.11013732105493546, 0.12288560718297958, 0.13563388586044312, 0.14838217198848724, 0.16113045811653137, 0.1738787442445755, 0.18662703037261963, 0.19937531650066376, 0.21212360262870789, 0.22487188875675201, 0.23762017488479614, 0.2503684461116791, 0.2631167471408844, 0.27586501836776733, 0.28861331939697266, 0.3013615906238556, 0.3141098916530609, 0.32685816287994385, 0.3396064341068268, 0.3523547351360321, 0.36510300636291504, 0.37785130739212036, 0.3905995786190033, 0.4033478796482086, 0.41609615087509155, 0.4288444519042969]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 11.0, 12.0, 14.0, 20.0, 24.0, 36.0, 67.0, 74.0, 102.0, 176.0, 272.0, 362.0, 619.0, 956.0, 1514.0, 2621.0, 4550.0, 8867.0, 18436.0, 44389.0, 153345.0, 1519080.0, 2126564.0, 213956.0, 53545.0, 21606.0, 10188.0, 5301.0, 2889.0, 1754.0, 980.0, 666.0, 446.0, 268.0, 171.0, 138.0, 81.0, 52.0, 41.0, 21.0, 21.0, 10.0, 15.0, 4.0, 4.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.125244140625, -0.12108230590820312, -0.11692047119140625, -0.11275863647460938, -0.1085968017578125, -0.10443496704101562, -0.10027313232421875, -0.09611129760742188, -0.091949462890625, -0.08778762817382812, -0.08362579345703125, -0.07946395874023438, -0.0753021240234375, -0.07114028930664062, -0.06697845458984375, -0.06281661987304688, -0.05865478515625, -0.054492950439453125, -0.05033111572265625, -0.046169281005859375, -0.0420074462890625, -0.037845611572265625, -0.03368377685546875, -0.029521942138671875, -0.025360107421875, -0.021198272705078125, -0.01703643798828125, -0.012874603271484375, -0.0087127685546875, -0.004550933837890625, -0.00038909912109375, 0.003772735595703125, 0.0079345703125, 0.012096405029296875, 0.01625823974609375, 0.020420074462890625, 0.0245819091796875, 0.028743743896484375, 0.03290557861328125, 0.037067413330078125, 0.041229248046875, 0.045391082763671875, 0.04955291748046875, 0.053714752197265625, 0.0578765869140625, 0.062038421630859375, 0.06620025634765625, 0.07036209106445312, 0.07452392578125, 0.07868576049804688, 0.08284759521484375, 0.08700942993164062, 0.0911712646484375, 0.09533309936523438, 0.09949493408203125, 0.10365676879882812, 0.107818603515625, 0.11198043823242188, 0.11614227294921875, 0.12030410766601562, 0.1244659423828125, 0.12862777709960938, 0.13278961181640625, 0.13695144653320312, 0.14111328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 3.0, 8.0, 10.0, 8.0, 14.0, 18.0, 18.0, 17.0, 23.0, 34.0, 33.0, 21.0, 42.0, 37.0, 44.0, 42.0, 38.0, 59.0, 56.0, 59.0, 39.0, 39.0, 40.0, 39.0, 38.0, 33.0, 34.0, 26.0, 27.0, 24.0, 12.0, 7.0, 13.0, 9.0, 5.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06622314453125, -0.06434822082519531, -0.062473297119140625, -0.06059837341308594, -0.05872344970703125, -0.05684852600097656, -0.054973602294921875, -0.05309867858886719, -0.0512237548828125, -0.04934883117675781, -0.047473907470703125, -0.04559898376464844, -0.04372406005859375, -0.04184913635253906, -0.039974212646484375, -0.03809928894042969, -0.036224365234375, -0.03434944152832031, -0.032474517822265625, -0.030599594116210938, -0.02872467041015625, -0.026849746704101562, -0.024974822998046875, -0.023099899291992188, -0.0212249755859375, -0.019350051879882812, -0.017475128173828125, -0.015600204467773438, -0.01372528076171875, -0.011850357055664062, -0.009975433349609375, -0.008100509643554688, -0.0062255859375, -0.0043506622314453125, -0.002475738525390625, -0.0006008148193359375, 0.00127410888671875, 0.0031490325927734375, 0.005023956298828125, 0.0068988800048828125, 0.0087738037109375, 0.010648727416992188, 0.012523651123046875, 0.014398574829101562, 0.01627349853515625, 0.018148422241210938, 0.020023345947265625, 0.021898269653320312, 0.023773193359375, 0.025648117065429688, 0.027523040771484375, 0.029397964477539062, 0.03127288818359375, 0.03314781188964844, 0.035022735595703125, 0.03689765930175781, 0.0387725830078125, 0.04064750671386719, 0.042522430419921875, 0.04439735412597656, 0.04627227783203125, 0.04814720153808594, 0.050022125244140625, 0.05189704895019531, 0.05377197265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 1.0, 7.0, 8.0, 5.0, 13.0, 25.0, 27.0, 44.0, 88.0, 133.0, 208.0, 356.0, 739.0, 1889.0, 5549.0, 21413.0, 119006.0, 1840967.0, 2044586.0, 126419.0, 22699.0, 6061.0, 2126.0, 901.0, 441.0, 230.0, 154.0, 75.0, 45.0, 26.0, 17.0, 13.0, 6.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.3603515625, -0.3519744873046875, -0.343597412109375, -0.3352203369140625, -0.32684326171875, -0.3184661865234375, -0.310089111328125, -0.3017120361328125, -0.2933349609375, -0.2849578857421875, -0.276580810546875, -0.2682037353515625, -0.25982666015625, -0.2514495849609375, -0.243072509765625, -0.2346954345703125, -0.226318359375, -0.2179412841796875, -0.209564208984375, -0.2011871337890625, -0.19281005859375, -0.1844329833984375, -0.176055908203125, -0.1676788330078125, -0.1593017578125, -0.1509246826171875, -0.142547607421875, -0.1341705322265625, -0.12579345703125, -0.1174163818359375, -0.109039306640625, -0.1006622314453125, -0.09228515625, -0.0839080810546875, -0.075531005859375, -0.0671539306640625, -0.05877685546875, -0.0503997802734375, -0.042022705078125, -0.0336456298828125, -0.0252685546875, -0.0168914794921875, -0.008514404296875, -0.0001373291015625, 0.00823974609375, 0.0166168212890625, 0.024993896484375, 0.0333709716796875, 0.041748046875, 0.0501251220703125, 0.058502197265625, 0.0668792724609375, 0.07525634765625, 0.0836334228515625, 0.092010498046875, 0.1003875732421875, 0.1087646484375, 0.1171417236328125, 0.125518798828125, 0.1338958740234375, 0.14227294921875, 0.1506500244140625, 0.159027099609375, 0.1674041748046875, 0.17578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 10.0, 15.0, 20.0, 46.0, 48.0, 83.0, 100.0, 134.0, 176.0, 358.0, 605.0, 807.0, 638.0, 386.0, 206.0, 131.0, 82.0, 64.0, 49.0, 21.0, 18.0, 23.0, 15.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11370563507080078, -0.10845375061035156, -0.10320186614990234, -0.09794998168945312, -0.0926980972290039, -0.08744621276855469, -0.08219432830810547, -0.07694244384765625, -0.07169055938720703, -0.06643867492675781, -0.061186790466308594, -0.055934906005859375, -0.050683021545410156, -0.04543113708496094, -0.04017925262451172, -0.0349273681640625, -0.02967548370361328, -0.024423599243164062, -0.019171714782714844, -0.013919830322265625, -0.008667945861816406, -0.0034160614013671875, 0.0018358230590820312, 0.00708770751953125, 0.012339591979980469, 0.017591476440429688, 0.022843360900878906, 0.028095245361328125, 0.033347129821777344, 0.03859901428222656, 0.04385089874267578, 0.049102783203125, 0.05435466766357422, 0.05960655212402344, 0.06485843658447266, 0.07011032104492188, 0.0753622055053711, 0.08061408996582031, 0.08586597442626953, 0.09111785888671875, 0.09636974334716797, 0.10162162780761719, 0.1068735122680664, 0.11212539672851562, 0.11737728118896484, 0.12262916564941406, 0.12788105010986328, 0.1331329345703125, 0.13838481903076172, 0.14363670349121094, 0.14888858795166016, 0.15414047241210938, 0.1593923568725586, 0.1646442413330078, 0.16989612579345703, 0.17514801025390625, 0.18039989471435547, 0.1856517791748047, 0.1909036636352539, 0.19615554809570312, 0.20140743255615234, 0.20665931701660156, 0.21191120147705078, 0.2171630859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 11.0, 11.0, 30.0, 76.0, 193.0, 350.0, 204.0, 83.0, 28.0, 19.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9967993497848511, -0.9433290362358093, -0.8898587822914124, -0.8363884687423706, -0.7829182147979736, -0.7294479012489319, -0.6759775876998901, -0.6225073337554932, -0.5690370202064514, -0.5155667066574097, -0.4620964527130127, -0.40862613916397095, -0.3551558554172516, -0.3016855716705322, -0.24821525812149048, -0.19474497437477112, -0.14127469062805176, -0.0878043994307518, -0.03433410823345184, 0.01913619041442871, 0.07260647416114807, 0.12607675790786743, 0.17954707145690918, 0.23301735520362854, 0.2864876389503479, 0.33995792269706726, 0.3934282064437866, 0.44689851999282837, 0.5003688335418701, 0.5538390874862671, 0.6073094010353088, 0.6607797145843506, 0.714249849319458, 0.7677201628684998, 0.8211904168128967, 0.8746607303619385, 0.9281309843063354, 0.9816012978553772, 1.035071611404419, 1.088541865348816, 1.142012119293213, 1.1954823732376099, 1.2489527463912964, 1.3024230003356934, 1.3558932542800903, 1.4093635082244873, 1.4628338813781738, 1.5163041353225708, 1.5697745084762573, 1.6232447624206543, 1.6767151355743408, 1.7301853895187378, 1.7836556434631348, 1.8371260166168213, 1.8905962705612183, 1.9440665245056152, 1.9975368976593018, 2.0510072708129883, 2.1044774055480957, 2.1579477787017822, 2.2114181518554688, 2.264888286590576, 2.3183586597442627, 2.371829032897949, 2.4252991676330566]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 6.0, 8.0, 15.0, 18.0, 22.0, 17.0, 25.0, 33.0, 32.0, 43.0, 30.0, 45.0, 41.0, 50.0, 35.0, 47.0, 55.0, 64.0, 47.0, 48.0, 39.0, 46.0, 50.0, 35.0, 31.0, 20.0, 23.0, 14.0, 11.0, 12.0, 10.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4721795916557312, -0.4545271396636963, -0.4368746876716614, -0.41922223567962646, -0.40156978368759155, -0.38391733169555664, -0.36626487970352173, -0.3486124277114868, -0.3309599757194519, -0.313307523727417, -0.2956550717353821, -0.27800261974334717, -0.26035016775131226, -0.24269771575927734, -0.22504527866840363, -0.2073928266763687, -0.189740389585495, -0.17208793759346008, -0.15443548560142517, -0.13678303360939026, -0.11913058906793594, -0.10147813707590103, -0.08382569253444672, -0.0661732405424118, -0.04852078855037689, -0.03086833842098713, -0.013215888291597366, 0.004436559975147247, 0.02208901196718216, 0.03974146395921707, 0.05739390850067139, 0.0750463604927063, 0.09269881248474121, 0.11035126447677612, 0.12800371646881104, 0.14565616846084595, 0.16330862045288086, 0.18096107244491577, 0.1986135095357895, 0.2162659615278244, 0.23391841351985931, 0.25157085061073303, 0.26922330260276794, 0.28687575459480286, 0.30452820658683777, 0.3221806585788727, 0.3398331105709076, 0.3574855625629425, 0.3751380145549774, 0.39279046654701233, 0.41044291853904724, 0.42809537053108215, 0.44574782252311707, 0.463400274515152, 0.4810526967048645, 0.4987051486968994, 0.5163576006889343, 0.5340100526809692, 0.5516625046730042, 0.5693149566650391, 0.586967408657074, 0.6046198606491089, 0.6222723126411438, 0.6399247646331787, 0.6575772166252136]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 5.0, 12.0, 16.0, 32.0, 45.0, 68.0, 94.0, 169.0, 298.0, 484.0, 877.0, 1590.0, 2988.0, 5972.0, 11797.0, 25295.0, 56657.0, 135798.0, 285885.0, 282183.0, 133277.0, 56397.0, 24418.0, 11639.0, 5827.0, 3020.0, 1608.0, 892.0, 480.0, 282.0, 177.0, 104.0, 66.0, 25.0, 27.0, 21.0, 9.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1517333984375, -0.1468372344970703, -0.14194107055664062, -0.13704490661621094, -0.13214874267578125, -0.12725257873535156, -0.12235641479492188, -0.11746025085449219, -0.1125640869140625, -0.10766792297363281, -0.10277175903320312, -0.09787559509277344, -0.09297943115234375, -0.08808326721191406, -0.08318710327148438, -0.07829093933105469, -0.073394775390625, -0.06849861145019531, -0.06360244750976562, -0.05870628356933594, -0.05381011962890625, -0.04891395568847656, -0.044017791748046875, -0.03912162780761719, -0.0342254638671875, -0.029329299926757812, -0.024433135986328125, -0.019536972045898438, -0.01464080810546875, -0.009744644165039062, -0.004848480224609375, 4.76837158203125e-05, 0.00494384765625, 0.009840011596679688, 0.014736175537109375, 0.019632339477539062, 0.02452850341796875, 0.029424667358398438, 0.034320831298828125, 0.03921699523925781, 0.0441131591796875, 0.04900932312011719, 0.053905487060546875, 0.05880165100097656, 0.06369781494140625, 0.06859397888183594, 0.07349014282226562, 0.07838630676269531, 0.083282470703125, 0.08817863464355469, 0.09307479858398438, 0.09797096252441406, 0.10286712646484375, 0.10776329040527344, 0.11265945434570312, 0.11755561828613281, 0.1224517822265625, 0.1273479461669922, 0.13224411010742188, 0.13714027404785156, 0.14203643798828125, 0.14693260192871094, 0.15182876586914062, 0.1567249298095703, 0.16162109375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 10.0, 6.0, 15.0, 7.0, 15.0, 15.0, 21.0, 16.0, 35.0, 29.0, 37.0, 31.0, 46.0, 44.0, 51.0, 45.0, 54.0, 49.0, 52.0, 52.0, 53.0, 36.0, 45.0, 36.0, 42.0, 10.0, 32.0, 24.0, 27.0, 11.0, 16.0, 12.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.05535888671875, -0.05359649658203125, -0.0518341064453125, -0.05007171630859375, -0.048309326171875, -0.04654693603515625, -0.0447845458984375, -0.04302215576171875, -0.041259765625, -0.03949737548828125, -0.0377349853515625, -0.03597259521484375, -0.034210205078125, -0.03244781494140625, -0.0306854248046875, -0.02892303466796875, -0.02716064453125, -0.02539825439453125, -0.0236358642578125, -0.02187347412109375, -0.020111083984375, -0.01834869384765625, -0.0165863037109375, -0.01482391357421875, -0.0130615234375, -0.01129913330078125, -0.0095367431640625, -0.00777435302734375, -0.006011962890625, -0.00424957275390625, -0.0024871826171875, -0.00072479248046875, 0.00103759765625, 0.00279998779296875, 0.0045623779296875, 0.00632476806640625, 0.008087158203125, 0.00984954833984375, 0.0116119384765625, 0.01337432861328125, 0.01513671875, 0.01689910888671875, 0.0186614990234375, 0.02042388916015625, 0.022186279296875, 0.02394866943359375, 0.0257110595703125, 0.02747344970703125, 0.02923583984375, 0.03099822998046875, 0.0327606201171875, 0.03452301025390625, 0.036285400390625, 0.03804779052734375, 0.0398101806640625, 0.04157257080078125, 0.0433349609375, 0.04509735107421875, 0.0468597412109375, 0.04862213134765625, 0.050384521484375, 0.05214691162109375, 0.0539093017578125, 0.05567169189453125, 0.05743408203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 10.0, 7.0, 15.0, 26.0, 29.0, 39.0, 56.0, 90.0, 109.0, 154.0, 258.0, 369.0, 555.0, 863.0, 1348.0, 2239.0, 3640.0, 6556.0, 11878.0, 23019.0, 46218.0, 98171.0, 207272.0, 294649.0, 181373.0, 84431.0, 40098.0, 19905.0, 10459.0, 5756.0, 3292.0, 2045.0, 1246.0, 759.0, 519.0, 360.0, 223.0, 155.0, 105.0, 77.0, 53.0, 43.0, 25.0, 16.0, 14.0, 13.0, 11.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1507568359375, -0.1461048126220703, -0.14145278930664062, -0.13680076599121094, -0.13214874267578125, -0.12749671936035156, -0.12284469604492188, -0.11819267272949219, -0.1135406494140625, -0.10888862609863281, -0.10423660278320312, -0.09958457946777344, -0.09493255615234375, -0.09028053283691406, -0.08562850952148438, -0.08097648620605469, -0.076324462890625, -0.07167243957519531, -0.06702041625976562, -0.06236839294433594, -0.05771636962890625, -0.05306434631347656, -0.048412322998046875, -0.04376029968261719, -0.0391082763671875, -0.03445625305175781, -0.029804229736328125, -0.025152206420898438, -0.02050018310546875, -0.015848159790039062, -0.011196136474609375, -0.0065441131591796875, -0.00189208984375, 0.0027599334716796875, 0.007411956787109375, 0.012063980102539062, 0.01671600341796875, 0.021368026733398438, 0.026020050048828125, 0.030672073364257812, 0.0353240966796875, 0.03997611999511719, 0.044628143310546875, 0.04928016662597656, 0.05393218994140625, 0.05858421325683594, 0.06323623657226562, 0.06788825988769531, 0.072540283203125, 0.07719230651855469, 0.08184432983398438, 0.08649635314941406, 0.09114837646484375, 0.09580039978027344, 0.10045242309570312, 0.10510444641113281, 0.1097564697265625, 0.11440849304199219, 0.11906051635742188, 0.12371253967285156, 0.12836456298828125, 0.13301658630371094, 0.13766860961914062, 0.1423206329345703, 0.14697265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 2.0, 8.0, 6.0, 11.0, 5.0, 13.0, 15.0, 14.0, 15.0, 31.0, 29.0, 28.0, 26.0, 32.0, 33.0, 39.0, 43.0, 46.0, 44.0, 48.0, 39.0, 49.0, 54.0, 33.0, 41.0, 32.0, 40.0, 36.0, 34.0, 20.0, 31.0, 17.0, 18.0, 20.0, 6.0, 12.0, 6.0, 10.0, 10.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.12591171264648438, -0.12157440185546875, -0.11723709106445312, -0.1128997802734375, -0.10856246948242188, -0.10422515869140625, -0.09988784790039062, -0.095550537109375, -0.09121322631835938, -0.08687591552734375, -0.08253860473632812, -0.0782012939453125, -0.07386398315429688, -0.06952667236328125, -0.06518936157226562, -0.06085205078125, -0.056514739990234375, -0.05217742919921875, -0.047840118408203125, -0.0435028076171875, -0.039165496826171875, -0.03482818603515625, -0.030490875244140625, -0.026153564453125, -0.021816253662109375, -0.01747894287109375, -0.013141632080078125, -0.0088043212890625, -0.004467010498046875, -0.00012969970703125, 0.004207611083984375, 0.008544921875, 0.012882232666015625, 0.01721954345703125, 0.021556854248046875, 0.0258941650390625, 0.030231475830078125, 0.03456878662109375, 0.038906097412109375, 0.043243408203125, 0.047580718994140625, 0.05191802978515625, 0.056255340576171875, 0.0605926513671875, 0.06492996215820312, 0.06926727294921875, 0.07360458374023438, 0.07794189453125, 0.08227920532226562, 0.08661651611328125, 0.09095382690429688, 0.0952911376953125, 0.09962844848632812, 0.10396575927734375, 0.10830307006835938, 0.112640380859375, 0.11697769165039062, 0.12131500244140625, 0.12565231323242188, 0.1299896240234375, 0.13432693481445312, 0.13866424560546875, 0.14300155639648438, 0.1473388671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 12.0, 6.0, 19.0, 23.0, 52.0, 73.0, 138.0, 250.0, 535.0, 1179.0, 2921.0, 9335.0, 1013345.0, 14215.0, 3678.0, 1471.0, 612.0, 282.0, 156.0, 87.0, 48.0, 43.0, 17.0, 16.0, 7.0, 10.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.077117919921875, -1.04193115234375, -1.006744384765625, -0.9715576171875, -0.936370849609375, -0.90118408203125, -0.865997314453125, -0.830810546875, -0.795623779296875, -0.76043701171875, -0.725250244140625, -0.6900634765625, -0.654876708984375, -0.61968994140625, -0.584503173828125, -0.54931640625, -0.514129638671875, -0.47894287109375, -0.443756103515625, -0.4085693359375, -0.373382568359375, -0.33819580078125, -0.303009033203125, -0.267822265625, -0.232635498046875, -0.19744873046875, -0.162261962890625, -0.1270751953125, -0.091888427734375, -0.05670166015625, -0.021514892578125, 0.013671875, 0.048858642578125, 0.08404541015625, 0.119232177734375, 0.1544189453125, 0.189605712890625, 0.22479248046875, 0.259979248046875, 0.295166015625, 0.330352783203125, 0.36553955078125, 0.400726318359375, 0.4359130859375, 0.471099853515625, 0.50628662109375, 0.541473388671875, 0.57666015625, 0.611846923828125, 0.64703369140625, 0.682220458984375, 0.7174072265625, 0.752593994140625, 0.78778076171875, 0.822967529296875, 0.858154296875, 0.893341064453125, 0.92852783203125, 0.963714599609375, 0.9989013671875, 1.034088134765625, 1.06927490234375, 1.104461669921875, 1.1396484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 12.0, 157.0, 705.0, 108.0, 12.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022220611572265625, -0.0002174200490117073, -0.00021263398230075836, -0.00020784791558980942, -0.00020306184887886047, -0.00019827578216791153, -0.00019348971545696259, -0.00018870364874601364, -0.0001839175820350647, -0.00017913151532411575, -0.0001743454486131668, -0.00016955938190221786, -0.00016477331519126892, -0.00015998724848031998, -0.00015520118176937103, -0.0001504151150584221, -0.00014562904834747314, -0.0001408429816365242, -0.00013605691492557526, -0.0001312708482146263, -0.00012648478150367737, -0.00012169871479272842, -0.00011691264808177948, -0.00011212658137083054, -0.00010734051465988159, -0.00010255444794893265, -9.77683812379837e-05, -9.298231452703476e-05, -8.819624781608582e-05, -8.341018110513687e-05, -7.862411439418793e-05, -7.383804768323898e-05, -6.905198097229004e-05, -6.42659142613411e-05, -5.947984755039215e-05, -5.469378083944321e-05, -4.990771412849426e-05, -4.512164741754532e-05, -4.0335580706596375e-05, -3.554951399564743e-05, -3.0763447284698486e-05, -2.5977380573749542e-05, -2.1191313862800598e-05, -1.6405247151851654e-05, -1.161918044090271e-05, -6.833113729953766e-06, -2.0470470190048218e-06, 2.7390196919441223e-06, 7.525086402893066e-06, 1.231115311384201e-05, 1.7097219824790955e-05, 2.18832865357399e-05, 2.6669353246688843e-05, 3.145541995763779e-05, 3.624148666858673e-05, 4.1027553379535675e-05, 4.581362009048462e-05, 5.059968680143356e-05, 5.538575351238251e-05, 6.017182022333145e-05, 6.49578869342804e-05, 6.974395364522934e-05, 7.453002035617828e-05, 7.931608706712723e-05, 8.410215377807617e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 9.0, 10.0, 21.0, 26.0, 26.0, 44.0, 81.0, 122.0, 154.0, 261.0, 474.0, 808.0, 1407.0, 2528.0, 5108.0, 11077.0, 27129.0, 79319.0, 238458.0, 383515.0, 193634.0, 62764.0, 22469.0, 9233.0, 4531.0, 2298.0, 1260.0, 668.0, 393.0, 255.0, 145.0, 112.0, 69.0, 47.0, 29.0, 20.0, 11.0, 13.0, 6.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055023193359375, -0.053151607513427734, -0.05128002166748047, -0.0494084358215332, -0.04753684997558594, -0.04566526412963867, -0.043793678283691406, -0.04192209243774414, -0.040050506591796875, -0.03817892074584961, -0.036307334899902344, -0.03443574905395508, -0.03256416320800781, -0.030692577362060547, -0.02882099151611328, -0.026949405670166016, -0.02507781982421875, -0.023206233978271484, -0.02133464813232422, -0.019463062286376953, -0.017591476440429688, -0.015719890594482422, -0.013848304748535156, -0.01197671890258789, -0.010105133056640625, -0.00823354721069336, -0.006361961364746094, -0.004490375518798828, -0.0026187896728515625, -0.0007472038269042969, 0.0011243820190429688, 0.0029959678649902344, 0.0048675537109375, 0.006739139556884766, 0.008610725402832031, 0.010482311248779297, 0.012353897094726562, 0.014225482940673828, 0.016097068786621094, 0.01796865463256836, 0.019840240478515625, 0.02171182632446289, 0.023583412170410156, 0.025454998016357422, 0.027326583862304688, 0.029198169708251953, 0.03106975555419922, 0.032941341400146484, 0.03481292724609375, 0.036684513092041016, 0.03855609893798828, 0.04042768478393555, 0.04229927062988281, 0.04417085647583008, 0.046042442321777344, 0.04791402816772461, 0.049785614013671875, 0.05165719985961914, 0.053528785705566406, 0.05540037155151367, 0.05727195739746094, 0.0591435432434082, 0.06101512908935547, 0.06288671493530273, 0.06475830078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 8.0, 9.0, 7.0, 11.0, 21.0, 14.0, 15.0, 22.0, 30.0, 34.0, 52.0, 65.0, 61.0, 59.0, 57.0, 69.0, 59.0, 64.0, 53.0, 46.0, 35.0, 43.0, 30.0, 26.0, 19.0, 14.0, 12.0, 6.0, 6.0, 2.0, 3.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.031219482421875, -0.030238628387451172, -0.029257774353027344, -0.028276920318603516, -0.027296066284179688, -0.02631521224975586, -0.02533435821533203, -0.024353504180908203, -0.023372650146484375, -0.022391796112060547, -0.02141094207763672, -0.02043008804321289, -0.019449234008789062, -0.018468379974365234, -0.017487525939941406, -0.016506671905517578, -0.01552581787109375, -0.014544963836669922, -0.013564109802246094, -0.012583255767822266, -0.011602401733398438, -0.01062154769897461, -0.009640693664550781, -0.008659839630126953, -0.007678985595703125, -0.006698131561279297, -0.005717277526855469, -0.004736423492431641, -0.0037555694580078125, -0.0027747154235839844, -0.0017938613891601562, -0.0008130073547363281, 0.0001678466796875, 0.0011487007141113281, 0.0021295547485351562, 0.0031104087829589844, 0.0040912628173828125, 0.005072116851806641, 0.006052970886230469, 0.007033824920654297, 0.008014678955078125, 0.008995532989501953, 0.009976387023925781, 0.01095724105834961, 0.011938095092773438, 0.012918949127197266, 0.013899803161621094, 0.014880657196044922, 0.01586151123046875, 0.016842365264892578, 0.017823219299316406, 0.018804073333740234, 0.019784927368164062, 0.02076578140258789, 0.02174663543701172, 0.022727489471435547, 0.023708343505859375, 0.024689197540283203, 0.02567005157470703, 0.02665090560913086, 0.027631759643554688, 0.028612613677978516, 0.029593467712402344, 0.030574321746826172, 0.03155517578125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 15.0, 22.0, 78.0, 208.0, 348.0, 222.0, 72.0, 24.0, 8.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8911445140838623, -0.837341845035553, -0.7835391759872437, -0.7297364473342896, -0.6759337782859802, -0.6221311092376709, -0.5683284401893616, -0.5145257711410522, -0.46072307229042053, -0.4069204032421112, -0.3531177043914795, -0.29931503534317017, -0.24551235139369965, -0.19170966744422913, -0.1379069983959198, -0.08410429954528809, -0.03030163049697876, 0.023501049727201462, 0.07730372995138168, 0.1311064064502716, 0.18490909039974213, 0.23871177434921265, 0.292514443397522, 0.3463171422481537, 0.400119811296463, 0.45392248034477234, 0.507725179195404, 0.5615278482437134, 0.6153305172920227, 0.669133186340332, 0.7229359149932861, 0.7767385840415955, 0.8305412530899048, 0.8843439221382141, 0.9381465911865234, 0.9919493198394775, 1.045751929283142, 1.0995546579360962, 1.1533572673797607, 1.2071599960327148, 1.260962724685669, 1.314765453338623, 1.3685680627822876, 1.4223707914352417, 1.4761734008789062, 1.5299761295318604, 1.5837788581848145, 1.637581467628479, 1.6913840770721436, 1.7451868057250977, 1.7989894151687622, 1.8527921438217163, 1.9065947532653809, 1.960397481918335, 2.014200210571289, 2.068002939224243, 2.1218056678771973, 2.1756083965301514, 2.2294111251831055, 2.2832136154174805, 2.3370163440704346, 2.3908190727233887, 2.4446218013763428, 2.498424530029297, 2.552227020263672]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 4.0, 9.0, 7.0, 4.0, 14.0, 18.0, 22.0, 22.0, 28.0, 23.0, 27.0, 38.0, 28.0, 46.0, 32.0, 32.0, 54.0, 60.0, 52.0, 44.0, 41.0, 43.0, 37.0, 35.0, 36.0, 25.0, 31.0, 30.0, 28.0, 22.0, 19.0, 16.0, 14.0, 12.0, 8.0, 9.0, 12.0, 4.0, 4.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.5137677192687988, -0.5008597373962402, -0.4879518151283264, -0.4750438630580902, -0.462135910987854, -0.4492279291152954, -0.4363199770450592, -0.423412024974823, -0.4105040729045868, -0.3975961208343506, -0.3846881687641144, -0.3717802166938782, -0.3588722348213196, -0.34596431255340576, -0.33305633068084717, -0.32014837861061096, -0.30724042654037476, -0.29433247447013855, -0.28142452239990234, -0.26851657032966614, -0.25560861825942993, -0.24270065128803253, -0.22979268431663513, -0.21688473224639893, -0.20397678017616272, -0.1910688281059265, -0.1781608760356903, -0.1652529090642929, -0.1523449569940567, -0.1394370049238205, -0.1265290379524231, -0.11362108588218689, -0.10071313381195068, -0.08780518174171448, -0.07489722222089767, -0.06198926642537117, -0.049081310629844666, -0.03617335855960846, -0.023265399038791656, -0.010357439517974854, 0.0025505125522613525, 0.015458468347787857, 0.02836642414331436, 0.041274379938840866, 0.05418233573436737, 0.06709028780460358, 0.07999824732542038, 0.09290620684623718, 0.10581415891647339, 0.1187221109867096, 0.1316300630569458, 0.1445380300283432, 0.1574459820985794, 0.1703539341688156, 0.183261901140213, 0.19616985321044922, 0.20907780528068542, 0.22198575735092163, 0.23489370942115784, 0.24780167639255524, 0.26070964336395264, 0.27361756563186646, 0.28652554750442505, 0.29943349957466125, 0.31234145164489746]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 9.0, 4.0, 5.0, 5.0, 2.0, 6.0, 10.0, 7.0, 9.0, 15.0, 17.0, 19.0, 27.0, 27.0, 44.0, 44.0, 66.0, 108.0, 221.0, 513.0, 1870.0, 16164.0, 880083.0, 3258773.0, 31971.0, 2939.0, 637.0, 261.0, 104.0, 63.0, 53.0, 39.0, 35.0, 26.0, 22.0, 14.0, 13.0, 12.0, 12.0, 11.0, 4.0, 7.0, 5.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.394287109375, -0.3820152282714844, -0.36974334716796875, -0.3574714660644531, -0.3451995849609375, -0.3329277038574219, -0.32065582275390625, -0.3083839416503906, -0.296112060546875, -0.2838401794433594, -0.27156829833984375, -0.2592964172363281, -0.2470245361328125, -0.23475265502929688, -0.22248077392578125, -0.21020889282226562, -0.19793701171875, -0.18566513061523438, -0.17339324951171875, -0.16112136840820312, -0.1488494873046875, -0.13657760620117188, -0.12430572509765625, -0.11203384399414062, -0.099761962890625, -0.08749008178710938, -0.07521820068359375, -0.06294631958007812, -0.0506744384765625, -0.038402557373046875, -0.02613067626953125, -0.013858795166015625, -0.0015869140625, 0.010684967041015625, 0.02295684814453125, 0.035228729248046875, 0.0475006103515625, 0.059772491455078125, 0.07204437255859375, 0.08431625366210938, 0.096588134765625, 0.10886001586914062, 0.12113189697265625, 0.13340377807617188, 0.1456756591796875, 0.15794754028320312, 0.17021942138671875, 0.18249130249023438, 0.19476318359375, 0.20703506469726562, 0.21930694580078125, 0.23157882690429688, 0.2438507080078125, 0.2561225891113281, 0.26839447021484375, 0.2806663513183594, 0.292938232421875, 0.3052101135253906, 0.31748199462890625, 0.3297538757324219, 0.3420257568359375, 0.3542976379394531, 0.36656951904296875, 0.3788414001464844, 0.39111328125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 3.0, 5.0, 8.0, 6.0, 15.0, 11.0, 13.0, 15.0, 14.0, 19.0, 23.0, 30.0, 32.0, 28.0, 33.0, 34.0, 33.0, 36.0, 35.0, 41.0, 37.0, 34.0, 51.0, 44.0, 36.0, 41.0, 38.0, 30.0, 27.0, 30.0, 35.0, 30.0, 21.0, 14.0, 21.0, 12.0, 7.0, 9.0, 11.0, 5.0, 6.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0479736328125, -0.04642438888549805, -0.044875144958496094, -0.04332590103149414, -0.04177665710449219, -0.040227413177490234, -0.03867816925048828, -0.03712892532348633, -0.035579681396484375, -0.03403043746948242, -0.03248119354248047, -0.030931949615478516, -0.029382705688476562, -0.02783346176147461, -0.026284217834472656, -0.024734973907470703, -0.02318572998046875, -0.021636486053466797, -0.020087242126464844, -0.01853799819946289, -0.016988754272460938, -0.015439510345458984, -0.013890266418457031, -0.012341022491455078, -0.010791778564453125, -0.009242534637451172, -0.007693290710449219, -0.006144046783447266, -0.0045948028564453125, -0.0030455589294433594, -0.0014963150024414062, 5.2928924560546875e-05, 0.0016021728515625, 0.003151416778564453, 0.004700660705566406, 0.006249904632568359, 0.0077991485595703125, 0.009348392486572266, 0.010897636413574219, 0.012446880340576172, 0.013996124267578125, 0.015545368194580078, 0.01709461212158203, 0.018643856048583984, 0.020193099975585938, 0.02174234390258789, 0.023291587829589844, 0.024840831756591797, 0.02639007568359375, 0.027939319610595703, 0.029488563537597656, 0.03103780746459961, 0.03258705139160156, 0.034136295318603516, 0.03568553924560547, 0.03723478317260742, 0.038784027099609375, 0.04033327102661133, 0.04188251495361328, 0.043431758880615234, 0.04498100280761719, 0.04653024673461914, 0.048079490661621094, 0.04962873458862305, 0.051177978515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 23.0, 26.0, 43.0, 65.0, 89.0, 144.0, 260.0, 394.0, 806.0, 1795.0, 4955.0, 17289.0, 89221.0, 891680.0, 2874629.0, 259569.0, 38533.0, 9089.0, 3034.0, 1187.0, 604.0, 323.0, 184.0, 116.0, 72.0, 50.0, 24.0, 16.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17658233642578125, -0.1705474853515625, -0.16451263427734375, -0.158477783203125, -0.15244293212890625, -0.1464080810546875, -0.14037322998046875, -0.13433837890625, -0.12830352783203125, -0.1222686767578125, -0.11623382568359375, -0.110198974609375, -0.10416412353515625, -0.0981292724609375, -0.09209442138671875, -0.0860595703125, -0.08002471923828125, -0.0739898681640625, -0.06795501708984375, -0.061920166015625, -0.05588531494140625, -0.0498504638671875, -0.04381561279296875, -0.03778076171875, -0.03174591064453125, -0.0257110595703125, -0.01967620849609375, -0.013641357421875, -0.00760650634765625, -0.0015716552734375, 0.00446319580078125, 0.010498046875, 0.01653289794921875, 0.0225677490234375, 0.02860260009765625, 0.034637451171875, 0.04067230224609375, 0.0467071533203125, 0.05274200439453125, 0.05877685546875, 0.06481170654296875, 0.0708465576171875, 0.07688140869140625, 0.082916259765625, 0.08895111083984375, 0.0949859619140625, 0.10102081298828125, 0.1070556640625, 0.11309051513671875, 0.1191253662109375, 0.12516021728515625, 0.131195068359375, 0.13722991943359375, 0.1432647705078125, 0.14929962158203125, 0.15533447265625, 0.16136932373046875, 0.1674041748046875, 0.17343902587890625, 0.179473876953125, 0.18550872802734375, 0.1915435791015625, 0.19757843017578125, 0.20361328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 6.0, 14.0, 16.0, 22.0, 31.0, 42.0, 53.0, 103.0, 139.0, 177.0, 261.0, 396.0, 666.0, 668.0, 477.0, 312.0, 208.0, 125.0, 96.0, 64.0, 52.0, 44.0, 24.0, 19.0, 18.0, 11.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1103515625, -0.10628509521484375, -0.1022186279296875, -0.09815216064453125, -0.094085693359375, -0.09001922607421875, -0.0859527587890625, -0.08188629150390625, -0.07781982421875, -0.07375335693359375, -0.0696868896484375, -0.06562042236328125, -0.061553955078125, -0.05748748779296875, -0.0534210205078125, -0.04935455322265625, -0.0452880859375, -0.04122161865234375, -0.0371551513671875, -0.03308868408203125, -0.029022216796875, -0.02495574951171875, -0.0208892822265625, -0.01682281494140625, -0.01275634765625, -0.00868988037109375, -0.0046234130859375, -0.00055694580078125, 0.003509521484375, 0.00757598876953125, 0.0116424560546875, 0.01570892333984375, 0.019775390625, 0.02384185791015625, 0.0279083251953125, 0.03197479248046875, 0.036041259765625, 0.04010772705078125, 0.0441741943359375, 0.04824066162109375, 0.05230712890625, 0.05637359619140625, 0.0604400634765625, 0.06450653076171875, 0.068572998046875, 0.07263946533203125, 0.0767059326171875, 0.08077239990234375, 0.0848388671875, 0.08890533447265625, 0.0929718017578125, 0.09703826904296875, 0.101104736328125, 0.10517120361328125, 0.1092376708984375, 0.11330413818359375, 0.11737060546875, 0.12143707275390625, 0.1255035400390625, 0.12957000732421875, 0.133636474609375, 0.13770294189453125, 0.1417694091796875, 0.14583587646484375, 0.14990234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 7.0, 6.0, 5.0, 8.0, 10.0, 14.0, 26.0, 36.0, 56.0, 64.0, 128.0, 127.0, 128.0, 113.0, 83.0, 57.0, 47.0, 34.0, 21.0, 13.0, 3.0, 9.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51695317029953, -0.49932047724723816, -0.4816877841949463, -0.4640551209449768, -0.44642242789268494, -0.42878973484039307, -0.4111570715904236, -0.3935243785381317, -0.37589168548583984, -0.358258992433548, -0.3406262993812561, -0.3229936361312866, -0.30536094307899475, -0.2877282500267029, -0.2700955867767334, -0.25246289372444153, -0.23483020067214966, -0.2171975076198578, -0.1995648294687271, -0.18193215131759644, -0.16429945826530457, -0.1466667652130127, -0.12903408706188202, -0.11140140146017075, -0.09376871585845947, -0.0761360302567482, -0.058503344655036926, -0.04087065905332565, -0.02323797345161438, -0.005605287849903107, 0.012027397751808167, 0.02966008335351944, 0.04729276895523071, 0.06492545455694199, 0.08255814015865326, 0.10019082576036453, 0.1178235113620758, 0.13545620441436768, 0.15308888256549835, 0.17072156071662903, 0.1883542537689209, 0.20598694682121277, 0.22361962497234344, 0.24125230312347412, 0.258884996175766, 0.27651768922805786, 0.29415035247802734, 0.3117830455303192, 0.3294157385826111, 0.34704843163490295, 0.3646811246871948, 0.3823137879371643, 0.3999464809894562, 0.41757917404174805, 0.43521183729171753, 0.4528445303440094, 0.47047722339630127, 0.48810991644859314, 0.505742609500885, 0.5233752727508545, 0.5410079956054688, 0.5586406588554382, 0.5762733221054077, 0.593906044960022, 0.6115387082099915]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 8.0, 0.0, 9.0, 6.0, 8.0, 4.0, 6.0, 7.0, 14.0, 18.0, 19.0, 18.0, 29.0, 24.0, 29.0, 39.0, 43.0, 36.0, 38.0, 33.0, 26.0, 38.0, 45.0, 39.0, 42.0, 32.0, 37.0, 33.0, 41.0, 30.0, 34.0, 25.0, 29.0, 27.0, 17.0, 27.0, 20.0, 19.0, 7.0, 7.0, 14.0, 7.0, 6.0, 3.0, 3.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28948819637298584, -0.27887579798698425, -0.26826339960098267, -0.25765103101730347, -0.24703861773014069, -0.2364262342453003, -0.2258138358592987, -0.21520143747329712, -0.20458903908729553, -0.19397664070129395, -0.18336425721645355, -0.17275185883045197, -0.16213946044445038, -0.15152707695960999, -0.1409146785736084, -0.1303022801876068, -0.11968989670276642, -0.10907750576734543, -0.09846510738134384, -0.08785271644592285, -0.07724031805992126, -0.06662792712450027, -0.056015536189079285, -0.0454031378030777, -0.03479074686765671, -0.02417835220694542, -0.01356595940887928, -0.002953566610813141, 0.007658828049898148, 0.018271222710609436, 0.028883613646030426, 0.03949601203203201, 0.050108402967453, 0.06072079762816429, 0.07133319228887558, 0.08194558322429657, 0.09255798161029816, 0.10317037254571915, 0.11378276348114014, 0.12439516186714172, 0.1350075602531433, 0.1456199586391449, 0.1562323421239853, 0.16684474050998688, 0.17745713889598846, 0.18806952238082886, 0.19868192076683044, 0.20929431915283203, 0.21990670263767242, 0.230519101023674, 0.2411314845085144, 0.251743882894516, 0.2623562812805176, 0.27296867966651917, 0.28358107805252075, 0.29419344663619995, 0.30480584502220154, 0.3154182434082031, 0.3260306417942047, 0.3366430401802063, 0.3472554087638855, 0.3578678071498871, 0.36848020553588867, 0.37909260392189026, 0.38970500230789185]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 10.0, 12.0, 26.0, 24.0, 27.0, 51.0, 64.0, 88.0, 119.0, 181.0, 269.0, 446.0, 642.0, 1027.0, 1541.0, 2794.0, 4795.0, 8464.0, 16088.0, 30437.0, 61360.0, 123496.0, 228257.0, 256059.0, 153744.0, 76568.0, 37791.0, 19433.0, 10464.0, 5806.0, 3219.0, 1977.0, 1169.0, 693.0, 427.0, 304.0, 215.0, 144.0, 107.0, 71.0, 43.0, 29.0, 21.0, 15.0, 21.0, 4.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.12139892578125, -0.11737346649169922, -0.11334800720214844, -0.10932254791259766, -0.10529708862304688, -0.1012716293334961, -0.09724617004394531, -0.09322071075439453, -0.08919525146484375, -0.08516979217529297, -0.08114433288574219, -0.0771188735961914, -0.07309341430664062, -0.06906795501708984, -0.06504249572753906, -0.06101703643798828, -0.0569915771484375, -0.05296611785888672, -0.04894065856933594, -0.044915199279785156, -0.040889739990234375, -0.036864280700683594, -0.03283882141113281, -0.02881336212158203, -0.02478790283203125, -0.02076244354248047, -0.016736984252929688, -0.012711524963378906, -0.008686065673828125, -0.004660606384277344, -0.0006351470947265625, 0.0033903121948242188, 0.007415771484375, 0.011441230773925781, 0.015466690063476562, 0.019492149353027344, 0.023517608642578125, 0.027543067932128906, 0.03156852722167969, 0.03559398651123047, 0.03961944580078125, 0.04364490509033203, 0.04767036437988281, 0.051695823669433594, 0.055721282958984375, 0.059746742248535156, 0.06377220153808594, 0.06779766082763672, 0.0718231201171875, 0.07584857940673828, 0.07987403869628906, 0.08389949798583984, 0.08792495727539062, 0.0919504165649414, 0.09597587585449219, 0.10000133514404297, 0.10402679443359375, 0.10805225372314453, 0.11207771301269531, 0.1161031723022461, 0.12012863159179688, 0.12415409088134766, 0.12817955017089844, 0.13220500946044922, 0.13623046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 10.0, 23.0, 33.0, 24.0, 33.0, 31.0, 57.0, 42.0, 47.0, 61.0, 41.0, 67.0, 69.0, 63.0, 49.0, 60.0, 34.0, 53.0, 36.0, 34.0, 27.0, 25.0, 22.0, 11.0, 9.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06402587890625, -0.0620269775390625, -0.060028076171875, -0.0580291748046875, -0.0560302734375, -0.0540313720703125, -0.052032470703125, -0.0500335693359375, -0.04803466796875, -0.0460357666015625, -0.044036865234375, -0.0420379638671875, -0.0400390625, -0.0380401611328125, -0.036041259765625, -0.0340423583984375, -0.03204345703125, -0.0300445556640625, -0.028045654296875, -0.0260467529296875, -0.0240478515625, -0.0220489501953125, -0.020050048828125, -0.0180511474609375, -0.01605224609375, -0.0140533447265625, -0.012054443359375, -0.0100555419921875, -0.008056640625, -0.0060577392578125, -0.004058837890625, -0.0020599365234375, -6.103515625e-05, 0.0019378662109375, 0.003936767578125, 0.0059356689453125, 0.0079345703125, 0.0099334716796875, 0.011932373046875, 0.0139312744140625, 0.01593017578125, 0.0179290771484375, 0.019927978515625, 0.0219268798828125, 0.02392578125, 0.0259246826171875, 0.027923583984375, 0.0299224853515625, 0.03192138671875, 0.0339202880859375, 0.035919189453125, 0.0379180908203125, 0.0399169921875, 0.0419158935546875, 0.043914794921875, 0.0459136962890625, 0.04791259765625, 0.0499114990234375, 0.051910400390625, 0.0539093017578125, 0.055908203125, 0.0579071044921875, 0.059906005859375, 0.0619049072265625, 0.06390380859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 11.0, 11.0, 21.0, 18.0, 22.0, 30.0, 45.0, 70.0, 80.0, 150.0, 207.0, 350.0, 570.0, 1025.0, 2143.0, 4915.0, 13780.0, 43052.0, 155523.0, 448333.0, 270070.0, 72556.0, 21898.0, 7414.0, 2960.0, 1370.0, 707.0, 407.0, 259.0, 159.0, 122.0, 71.0, 56.0, 43.0, 23.0, 18.0, 14.0, 10.0, 7.0, 11.0, 9.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.226806640625, -0.22045516967773438, -0.21410369873046875, -0.20775222778320312, -0.2014007568359375, -0.19504928588867188, -0.18869781494140625, -0.18234634399414062, -0.175994873046875, -0.16964340209960938, -0.16329193115234375, -0.15694046020507812, -0.1505889892578125, -0.14423751831054688, -0.13788604736328125, -0.13153457641601562, -0.12518310546875, -0.11883163452148438, -0.11248016357421875, -0.10612869262695312, -0.0997772216796875, -0.09342575073242188, -0.08707427978515625, -0.08072280883789062, -0.074371337890625, -0.06801986694335938, -0.06166839599609375, -0.055316925048828125, -0.0489654541015625, -0.042613983154296875, -0.03626251220703125, -0.029911041259765625, -0.0235595703125, -0.017208099365234375, -0.01085662841796875, -0.004505157470703125, 0.0018463134765625, 0.008197784423828125, 0.01454925537109375, 0.020900726318359375, 0.027252197265625, 0.033603668212890625, 0.03995513916015625, 0.046306610107421875, 0.0526580810546875, 0.059009552001953125, 0.06536102294921875, 0.07171249389648438, 0.07806396484375, 0.08441543579101562, 0.09076690673828125, 0.09711837768554688, 0.1034698486328125, 0.10982131958007812, 0.11617279052734375, 0.12252426147460938, 0.128875732421875, 0.13522720336914062, 0.14157867431640625, 0.14793014526367188, 0.1542816162109375, 0.16063308715820312, 0.16698455810546875, 0.17333602905273438, 0.1796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 8.0, 7.0, 12.0, 14.0, 11.0, 14.0, 27.0, 19.0, 28.0, 22.0, 26.0, 33.0, 45.0, 53.0, 38.0, 37.0, 37.0, 49.0, 45.0, 48.0, 37.0, 39.0, 42.0, 36.0, 30.0, 26.0, 27.0, 19.0, 28.0, 27.0, 23.0, 13.0, 16.0, 14.0, 10.0, 7.0, 8.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12249755859375, -0.11833477020263672, -0.11417198181152344, -0.11000919342041016, -0.10584640502929688, -0.1016836166381836, -0.09752082824707031, -0.09335803985595703, -0.08919525146484375, -0.08503246307373047, -0.08086967468261719, -0.0767068862915039, -0.07254409790039062, -0.06838130950927734, -0.06421852111816406, -0.06005573272705078, -0.0558929443359375, -0.05173015594482422, -0.04756736755371094, -0.043404579162597656, -0.039241790771484375, -0.035079002380371094, -0.030916213989257812, -0.02675342559814453, -0.02259063720703125, -0.01842784881591797, -0.014265060424804688, -0.010102272033691406, -0.005939483642578125, -0.0017766952514648438, 0.0023860931396484375, 0.006548881530761719, 0.010711669921875, 0.014874458312988281, 0.019037246704101562, 0.023200035095214844, 0.027362823486328125, 0.031525611877441406, 0.03568840026855469, 0.03985118865966797, 0.04401397705078125, 0.04817676544189453, 0.05233955383300781, 0.056502342224121094, 0.060665130615234375, 0.06482791900634766, 0.06899070739746094, 0.07315349578857422, 0.0773162841796875, 0.08147907257080078, 0.08564186096191406, 0.08980464935302734, 0.09396743774414062, 0.0981302261352539, 0.10229301452636719, 0.10645580291748047, 0.11061859130859375, 0.11478137969970703, 0.11894416809082031, 0.1231069564819336, 0.12726974487304688, 0.13143253326416016, 0.13559532165527344, 0.13975811004638672, 0.1439208984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 6.0, 5.0, 11.0, 23.0, 37.0, 41.0, 54.0, 89.0, 134.0, 264.0, 455.0, 864.0, 1988.0, 6331.0, 29666.0, 209702.0, 605552.0, 160906.0, 23458.0, 5282.0, 1822.0, 795.0, 404.0, 254.0, 153.0, 75.0, 46.0, 35.0, 28.0, 23.0, 8.0, 9.0, 5.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.08477783203125, -0.08257198333740234, -0.08036613464355469, -0.07816028594970703, -0.07595443725585938, -0.07374858856201172, -0.07154273986816406, -0.0693368911743164, -0.06713104248046875, -0.0649251937866211, -0.06271934509277344, -0.06051349639892578, -0.058307647705078125, -0.05610179901123047, -0.05389595031738281, -0.051690101623535156, -0.0494842529296875, -0.047278404235839844, -0.04507255554199219, -0.04286670684814453, -0.040660858154296875, -0.03845500946044922, -0.03624916076660156, -0.034043312072753906, -0.03183746337890625, -0.029631614685058594, -0.027425765991210938, -0.02521991729736328, -0.023014068603515625, -0.02080821990966797, -0.018602371215820312, -0.016396522521972656, -0.014190673828125, -0.011984825134277344, -0.009778976440429688, -0.007573127746582031, -0.005367279052734375, -0.0031614303588867188, -0.0009555816650390625, 0.0012502670288085938, 0.00345611572265625, 0.005661964416503906, 0.007867813110351562, 0.010073661804199219, 0.012279510498046875, 0.014485359191894531, 0.016691207885742188, 0.018897056579589844, 0.0211029052734375, 0.023308753967285156, 0.025514602661132812, 0.02772045135498047, 0.029926300048828125, 0.03213214874267578, 0.03433799743652344, 0.036543846130371094, 0.03874969482421875, 0.040955543518066406, 0.04316139221191406, 0.04536724090576172, 0.047573089599609375, 0.04977893829345703, 0.05198478698730469, 0.054190635681152344, 0.056396484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 4.0, 5.0, 2.0, 4.0, 7.0, 7.0, 6.0, 6.0, 12.0, 12.0, 14.0, 11.0, 23.0, 19.0, 39.0, 40.0, 37.0, 50.0, 41.0, 75.0, 60.0, 68.0, 59.0, 70.0, 53.0, 53.0, 39.0, 28.0, 27.0, 25.0, 22.0, 18.0, 10.0, 13.0, 7.0, 7.0, 4.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0132789611816406e-05, -9.814277291297913e-06, -9.495764970779419e-06, -9.177252650260925e-06, -8.858740329742432e-06, -8.540228009223938e-06, -8.221715688705444e-06, -7.90320336818695e-06, -7.584691047668457e-06, -7.266178727149963e-06, -6.94766640663147e-06, -6.629154086112976e-06, -6.310641765594482e-06, -5.992129445075989e-06, -5.673617124557495e-06, -5.3551048040390015e-06, -5.036592483520508e-06, -4.718080163002014e-06, -4.3995678424835205e-06, -4.081055521965027e-06, -3.762543201446533e-06, -3.4440308809280396e-06, -3.125518560409546e-06, -2.8070062398910522e-06, -2.4884939193725586e-06, -2.169981598854065e-06, -1.8514692783355713e-06, -1.5329569578170776e-06, -1.214444637298584e-06, -8.959323167800903e-07, -5.774199962615967e-07, -2.5890767574310303e-07, 5.960464477539063e-08, 3.781169652938843e-07, 6.966292858123779e-07, 1.0151416063308716e-06, 1.3336539268493652e-06, 1.6521662473678589e-06, 1.9706785678863525e-06, 2.289190888404846e-06, 2.60770320892334e-06, 2.9262155294418335e-06, 3.244727849960327e-06, 3.563240170478821e-06, 3.8817524909973145e-06, 4.200264811515808e-06, 4.518777132034302e-06, 4.837289452552795e-06, 5.155801773071289e-06, 5.474314093589783e-06, 5.792826414108276e-06, 6.11133873462677e-06, 6.429851055145264e-06, 6.748363375663757e-06, 7.066875696182251e-06, 7.385388016700745e-06, 7.703900337219238e-06, 8.022412657737732e-06, 8.340924978256226e-06, 8.65943729877472e-06, 8.977949619293213e-06, 9.296461939811707e-06, 9.6149742603302e-06, 9.933486580848694e-06, 1.0251998901367188e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 12.0, 22.0, 21.0, 40.0, 58.0, 93.0, 107.0, 167.0, 264.0, 480.0, 852.0, 1620.0, 3207.0, 7780.0, 23864.0, 93731.0, 392849.0, 391558.0, 93437.0, 23682.0, 7835.0, 3271.0, 1522.0, 784.0, 506.0, 276.0, 165.0, 109.0, 67.0, 51.0, 28.0, 13.0, 23.0, 9.0, 10.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.06396484375, -0.06213712692260742, -0.060309410095214844, -0.058481693267822266, -0.05665397644042969, -0.05482625961303711, -0.05299854278564453, -0.05117082595825195, -0.049343109130859375, -0.0475153923034668, -0.04568767547607422, -0.04385995864868164, -0.04203224182128906, -0.040204524993896484, -0.038376808166503906, -0.03654909133911133, -0.03472137451171875, -0.03289365768432617, -0.031065940856933594, -0.029238224029541016, -0.027410507202148438, -0.02558279037475586, -0.02375507354736328, -0.021927356719970703, -0.020099639892578125, -0.018271923065185547, -0.01644420623779297, -0.01461648941040039, -0.012788772583007812, -0.010961055755615234, -0.009133338928222656, -0.007305622100830078, -0.0054779052734375, -0.003650188446044922, -0.0018224716186523438, 5.245208740234375e-06, 0.0018329620361328125, 0.0036606788635253906, 0.005488395690917969, 0.007316112518310547, 0.009143829345703125, 0.010971546173095703, 0.012799263000488281, 0.01462697982788086, 0.016454696655273438, 0.018282413482666016, 0.020110130310058594, 0.021937847137451172, 0.02376556396484375, 0.025593280792236328, 0.027420997619628906, 0.029248714447021484, 0.031076431274414062, 0.03290414810180664, 0.03473186492919922, 0.0365595817565918, 0.038387298583984375, 0.04021501541137695, 0.04204273223876953, 0.04387044906616211, 0.04569816589355469, 0.047525882720947266, 0.049353599548339844, 0.05118131637573242, 0.053009033203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 0.0, 5.0, 4.0, 8.0, 5.0, 9.0, 6.0, 12.0, 11.0, 22.0, 11.0, 29.0, 35.0, 36.0, 58.0, 49.0, 51.0, 56.0, 82.0, 68.0, 66.0, 75.0, 41.0, 40.0, 41.0, 30.0, 28.0, 31.0, 11.0, 16.0, 12.0, 11.0, 8.0, 13.0, 9.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0306243896484375, -0.02964329719543457, -0.02866220474243164, -0.02768111228942871, -0.02670001983642578, -0.02571892738342285, -0.024737834930419922, -0.023756742477416992, -0.022775650024414062, -0.021794557571411133, -0.020813465118408203, -0.019832372665405273, -0.018851280212402344, -0.017870187759399414, -0.016889095306396484, -0.015908002853393555, -0.014926910400390625, -0.013945817947387695, -0.012964725494384766, -0.011983633041381836, -0.011002540588378906, -0.010021448135375977, -0.009040355682373047, -0.008059263229370117, -0.0070781707763671875, -0.006097078323364258, -0.005115985870361328, -0.0041348934173583984, -0.0031538009643554688, -0.002172708511352539, -0.0011916160583496094, -0.0002105236053466797, 0.00077056884765625, 0.0017516613006591797, 0.0027327537536621094, 0.003713846206665039, 0.004694938659667969, 0.0056760311126708984, 0.006657123565673828, 0.007638216018676758, 0.008619308471679688, 0.009600400924682617, 0.010581493377685547, 0.011562585830688477, 0.012543678283691406, 0.013524770736694336, 0.014505863189697266, 0.015486955642700195, 0.016468048095703125, 0.017449140548706055, 0.018430233001708984, 0.019411325454711914, 0.020392417907714844, 0.021373510360717773, 0.022354602813720703, 0.023335695266723633, 0.024316787719726562, 0.025297880172729492, 0.026278972625732422, 0.02726006507873535, 0.02824115753173828, 0.02922224998474121, 0.03020334243774414, 0.03118443489074707, 0.03216552734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 6.0, 20.0, 64.0, 145.0, 325.0, 246.0, 119.0, 43.0, 18.0, 8.0, 7.0, 5.0, 0.0, 0.0, 1.0], "bins": [-2.054638385772705, -2.0165109634399414, -1.9783833026885986, -1.9402557611465454, -1.9021282196044922, -1.864000678062439, -1.8258731365203857, -1.7877455949783325, -1.7496180534362793, -1.711490511894226, -1.6733629703521729, -1.6352354288101196, -1.5971078872680664, -1.5589803457260132, -1.52085280418396, -1.4827252626419067, -1.4445977210998535, -1.4064701795578003, -1.368342638015747, -1.3302150964736938, -1.2920875549316406, -1.2539600133895874, -1.2158324718475342, -1.177704930305481, -1.1395775079727173, -1.101449966430664, -1.0633224248886108, -1.0251948833465576, -0.9870673418045044, -0.9489398002624512, -0.910812258720398, -0.8726847171783447, -0.8345571756362915, -0.7964296340942383, -0.7583020925521851, -0.7201745510101318, -0.6820470094680786, -0.6439194679260254, -0.6057919263839722, -0.567664384841919, -0.5295368432998657, -0.4914093017578125, -0.4532817602157593, -0.41515421867370605, -0.37702667713165283, -0.3388991355895996, -0.3007716238498688, -0.26264408230781555, -0.22451657056808472, -0.1863890290260315, -0.14826148748397827, -0.11013396084308624, -0.07200641930103302, -0.0338788777589798, 0.0042486488819122314, 0.042376190423965454, 0.08050373196601868, 0.1186312735080719, 0.15675881505012512, 0.19488634169101715, 0.23301388323307037, 0.2711414098739624, 0.3092689514160156, 0.34739649295806885, 0.38552403450012207]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 6.0, 8.0, 17.0, 18.0, 10.0, 19.0, 29.0, 18.0, 36.0, 25.0, 37.0, 40.0, 42.0, 50.0, 49.0, 37.0, 60.0, 52.0, 47.0, 45.0, 39.0, 48.0, 44.0, 35.0, 31.0, 25.0, 27.0, 16.0, 20.0, 15.0, 16.0, 16.0, 3.0, 5.0, 6.0, 3.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.410067081451416, -0.3960208296775818, -0.38197457790374756, -0.36792832612991333, -0.3538820743560791, -0.3398358225822449, -0.32578957080841064, -0.31174328923225403, -0.2976970374584198, -0.28365078568458557, -0.26960453391075134, -0.2555582821369171, -0.2415120154619217, -0.22746576368808746, -0.21341951191425323, -0.1993732452392578, -0.18532700836658478, -0.17128075659275055, -0.15723450481891632, -0.1431882381439209, -0.12914198637008667, -0.11509573459625244, -0.10104948282241821, -0.08700322359800339, -0.07295697182416916, -0.05891071632504463, -0.044864460825920105, -0.030818209052085876, -0.01677195355296135, -0.0027256980538368225, 0.011320553719997406, 0.02536681294441223, 0.03941306471824646, 0.05345932021737099, 0.06750557571649551, 0.08155182749032974, 0.09559808671474457, 0.1096443384885788, 0.12369059026241302, 0.13773685693740845, 0.15178310871124268, 0.1658293604850769, 0.17987561225891113, 0.19392186403274536, 0.20796813070774078, 0.222014382481575, 0.23606063425540924, 0.25010690093040466, 0.2641531229019165, 0.27819937467575073, 0.29224562644958496, 0.3062918782234192, 0.3203381299972534, 0.33438438177108765, 0.3484306335449219, 0.3624769151210785, 0.3765231668949127, 0.39056941866874695, 0.4046156704425812, 0.4186619222164154, 0.43270817399024963, 0.44675445556640625, 0.4608007073402405, 0.4748469591140747, 0.48889321088790894]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 10.0, 15.0, 28.0, 23.0, 33.0, 75.0, 116.0, 195.0, 436.0, 958.0, 2431.0, 7754.0, 31736.0, 228124.0, 3349358.0, 507903.0, 48015.0, 11022.0, 3525.0, 1281.0, 597.0, 260.0, 163.0, 88.0, 44.0, 26.0, 24.0, 12.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.1604766845703125, -0.155059814453125, -0.1496429443359375, -0.14422607421875, -0.1388092041015625, -0.133392333984375, -0.1279754638671875, -0.12255859375, -0.1171417236328125, -0.111724853515625, -0.1063079833984375, -0.10089111328125, -0.0954742431640625, -0.090057373046875, -0.0846405029296875, -0.0792236328125, -0.0738067626953125, -0.068389892578125, -0.0629730224609375, -0.05755615234375, -0.0521392822265625, -0.046722412109375, -0.0413055419921875, -0.035888671875, -0.0304718017578125, -0.025054931640625, -0.0196380615234375, -0.01422119140625, -0.0088043212890625, -0.003387451171875, 0.0020294189453125, 0.0074462890625, 0.0128631591796875, 0.018280029296875, 0.0236968994140625, 0.02911376953125, 0.0345306396484375, 0.039947509765625, 0.0453643798828125, 0.05078125, 0.0561981201171875, 0.061614990234375, 0.0670318603515625, 0.07244873046875, 0.0778656005859375, 0.083282470703125, 0.0886993408203125, 0.0941162109375, 0.0995330810546875, 0.104949951171875, 0.1103668212890625, 0.11578369140625, 0.1212005615234375, 0.126617431640625, 0.1320343017578125, 0.137451171875, 0.1428680419921875, 0.148284912109375, 0.1537017822265625, 0.15911865234375, 0.1645355224609375, 0.169952392578125, 0.1753692626953125, 0.1807861328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 6.0, 9.0, 9.0, 13.0, 16.0, 27.0, 34.0, 44.0, 33.0, 47.0, 66.0, 68.0, 81.0, 67.0, 70.0, 67.0, 70.0, 42.0, 62.0, 36.0, 25.0, 23.0, 23.0, 16.0, 23.0, 6.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07293701171875, -0.07077693939208984, -0.06861686706542969, -0.06645679473876953, -0.06429672241210938, -0.06213665008544922, -0.05997657775878906, -0.057816505432128906, -0.05565643310546875, -0.053496360778808594, -0.05133628845214844, -0.04917621612548828, -0.047016143798828125, -0.04485607147216797, -0.04269599914550781, -0.040535926818847656, -0.0383758544921875, -0.036215782165527344, -0.03405570983886719, -0.03189563751220703, -0.029735565185546875, -0.02757549285888672, -0.025415420532226562, -0.023255348205566406, -0.02109527587890625, -0.018935203552246094, -0.016775131225585938, -0.014615058898925781, -0.012454986572265625, -0.010294914245605469, -0.008134841918945312, -0.005974769592285156, -0.003814697265625, -0.0016546249389648438, 0.0005054473876953125, 0.0026655197143554688, 0.004825592041015625, 0.006985664367675781, 0.009145736694335938, 0.011305809020996094, 0.01346588134765625, 0.015625953674316406, 0.017786026000976562, 0.01994609832763672, 0.022106170654296875, 0.02426624298095703, 0.026426315307617188, 0.028586387634277344, 0.0307464599609375, 0.032906532287597656, 0.03506660461425781, 0.03722667694091797, 0.039386749267578125, 0.04154682159423828, 0.04370689392089844, 0.045866966247558594, 0.04802703857421875, 0.050187110900878906, 0.05234718322753906, 0.05450725555419922, 0.056667327880859375, 0.05882740020751953, 0.06098747253417969, 0.06314754486083984, 0.0653076171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 10.0, 3.0, 8.0, 11.0, 13.0, 35.0, 43.0, 72.0, 105.0, 232.0, 566.0, 2276.0, 22367.0, 1865100.0, 2275063.0, 24857.0, 2311.0, 598.0, 268.0, 148.0, 71.0, 44.0, 23.0, 24.0, 6.0, 9.0, 6.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.47509765625, -0.46430397033691406, -0.4535102844238281, -0.4427165985107422, -0.43192291259765625, -0.4211292266845703, -0.4103355407714844, -0.39954185485839844, -0.3887481689453125, -0.37795448303222656, -0.3671607971191406, -0.3563671112060547, -0.34557342529296875, -0.3347797393798828, -0.3239860534667969, -0.31319236755371094, -0.302398681640625, -0.29160499572753906, -0.2808113098144531, -0.2700176239013672, -0.25922393798828125, -0.2484302520751953, -0.23763656616210938, -0.22684288024902344, -0.2160491943359375, -0.20525550842285156, -0.19446182250976562, -0.1836681365966797, -0.17287445068359375, -0.1620807647705078, -0.15128707885742188, -0.14049339294433594, -0.12969970703125, -0.11890602111816406, -0.10811233520507812, -0.09731864929199219, -0.08652496337890625, -0.07573127746582031, -0.06493759155273438, -0.05414390563964844, -0.0433502197265625, -0.03255653381347656, -0.021762847900390625, -0.010969161987304688, -0.00017547607421875, 0.010618209838867188, 0.021411895751953125, 0.03220558166503906, 0.042999267578125, 0.05379295349121094, 0.06458663940429688, 0.07538032531738281, 0.08617401123046875, 0.09696769714355469, 0.10776138305664062, 0.11855506896972656, 0.1293487548828125, 0.14014244079589844, 0.15093612670898438, 0.1617298126220703, 0.17252349853515625, 0.1833171844482422, 0.19411087036132812, 0.20490455627441406, 0.2156982421875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 2.0, 4.0, 12.0, 12.0, 16.0, 24.0, 42.0, 51.0, 76.0, 111.0, 155.0, 224.0, 428.0, 759.0, 821.0, 512.0, 296.0, 162.0, 116.0, 83.0, 47.0, 36.0, 22.0, 16.0, 11.0, 7.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0804443359375, -0.07662773132324219, -0.07281112670898438, -0.06899452209472656, -0.06517791748046875, -0.06136131286621094, -0.057544708251953125, -0.05372810363769531, -0.0499114990234375, -0.04609489440917969, -0.042278289794921875, -0.03846168518066406, -0.03464508056640625, -0.030828475952148438, -0.027011871337890625, -0.023195266723632812, -0.019378662109375, -0.015562057495117188, -0.011745452880859375, -0.007928848266601562, -0.00411224365234375, -0.0002956390380859375, 0.003520965576171875, 0.0073375701904296875, 0.0111541748046875, 0.014970779418945312, 0.018787384033203125, 0.022603988647460938, 0.02642059326171875, 0.030237197875976562, 0.034053802490234375, 0.03787040710449219, 0.04168701171875, 0.04550361633300781, 0.049320220947265625, 0.05313682556152344, 0.05695343017578125, 0.06077003479003906, 0.06458663940429688, 0.06840324401855469, 0.0722198486328125, 0.07603645324707031, 0.07985305786132812, 0.08366966247558594, 0.08748626708984375, 0.09130287170410156, 0.09511947631835938, 0.09893608093261719, 0.102752685546875, 0.10656929016113281, 0.11038589477539062, 0.11420249938964844, 0.11801910400390625, 0.12183570861816406, 0.12565231323242188, 0.1294689178466797, 0.1332855224609375, 0.1371021270751953, 0.14091873168945312, 0.14473533630371094, 0.14855194091796875, 0.15236854553222656, 0.15618515014648438, 0.1600017547607422, 0.163818359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 9.0, 18.0, 90.0, 259.0, 396.0, 179.0, 31.0, 19.0, 6.0, 4.0, 3.0, 0.0, 1.0], "bins": [-2.58262300491333, -2.5358972549438477, -2.4891717433929443, -2.442445993423462, -2.3957202434539795, -2.348994731903076, -2.3022689819335938, -2.2555432319641113, -2.208817481994629, -2.1620917320251465, -2.115366220474243, -2.0686404705047607, -2.0219147205352783, -1.9751890897750854, -1.9284634590148926, -1.8817377090454102, -1.8350121974945068, -1.788286566734314, -1.7415608167648315, -1.6948351860046387, -1.6481094360351562, -1.6013838052749634, -1.5546581745147705, -1.507932424545288, -1.4612066745758057, -1.4144810438156128, -1.3677552938461304, -1.3210296630859375, -1.274303913116455, -1.2275782823562622, -1.1808526515960693, -1.134126901626587, -1.0874011516571045, -1.0406755208969116, -0.9939497709274292, -0.9472241401672363, -0.9004984498023987, -0.853772759437561, -0.8070470690727234, -0.7603213787078857, -0.7135957479476929, -0.6668700575828552, -0.6201443672180176, -0.5734187364578247, -0.5266930460929871, -0.4799673557281494, -0.43324166536331177, -0.3865160048007965, -0.33979034423828125, -0.2930646538734436, -0.24633899331092834, -0.1996133029460907, -0.15288762748241425, -0.10616195201873779, -0.059436261653900146, -0.012710601091384888, 0.03401508927345276, 0.08074076473712921, 0.12746644020080566, 0.1741921305656433, 0.22091780602931976, 0.2676434814929962, 0.31436917185783386, 0.3610948324203491, 0.40782052278518677]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 12.0, 5.0, 11.0, 13.0, 20.0, 15.0, 19.0, 15.0, 34.0, 26.0, 38.0, 36.0, 33.0, 33.0, 39.0, 53.0, 58.0, 50.0, 48.0, 51.0, 34.0, 41.0, 39.0, 36.0, 38.0, 38.0, 39.0, 25.0, 24.0, 15.0, 17.0, 9.0, 11.0, 11.0, 2.0, 7.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29742372035980225, -0.28716957569122314, -0.27691543102264404, -0.26666128635406494, -0.25640714168548584, -0.24615299701690674, -0.23589886724948883, -0.22564472258090973, -0.21539057791233063, -0.20513643324375153, -0.19488228857517242, -0.18462814390659332, -0.17437401413917542, -0.1641198694705963, -0.1538657248020172, -0.1436115801334381, -0.133357435464859, -0.12310329079627991, -0.1128491461277008, -0.1025950089097023, -0.0923408642411232, -0.0820867195725441, -0.0718325823545456, -0.06157843768596649, -0.05132429301738739, -0.04107014834880829, -0.030816007405519485, -0.020561864599585533, -0.01030772179365158, -5.357712507247925e-05, 0.010200563818216324, 0.020454704761505127, 0.03070884943008423, 0.04096299409866333, 0.05121713504195213, 0.061471275985240936, 0.07172542065382004, 0.08197956532239914, 0.09223370254039764, 0.10248784720897675, 0.11274199187755585, 0.12299613654613495, 0.13325028121471405, 0.14350442588329315, 0.15375855565071106, 0.16401270031929016, 0.17426684498786926, 0.18452098965644836, 0.19477513432502747, 0.20502927899360657, 0.21528342366218567, 0.22553756833076477, 0.23579171299934387, 0.24604585766792297, 0.2563000023365021, 0.2665541172027588, 0.2768082618713379, 0.287062406539917, 0.2973165512084961, 0.3075706958770752, 0.3178248405456543, 0.3280789852142334, 0.3383331298828125, 0.3485872745513916, 0.3588414192199707]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 7.0, 19.0, 13.0, 25.0, 26.0, 27.0, 50.0, 68.0, 100.0, 140.0, 204.0, 353.0, 704.0, 1224.0, 2710.0, 6005.0, 14893.0, 42372.0, 137954.0, 376074.0, 311612.0, 100594.0, 32068.0, 11747.0, 4794.0, 2238.0, 1026.0, 558.0, 310.0, 205.0, 124.0, 83.0, 82.0, 49.0, 19.0, 20.0, 13.0, 11.0, 4.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1326904296875, -0.1282482147216797, -0.12380599975585938, -0.11936378479003906, -0.11492156982421875, -0.11047935485839844, -0.10603713989257812, -0.10159492492675781, -0.0971527099609375, -0.09271049499511719, -0.08826828002929688, -0.08382606506347656, -0.07938385009765625, -0.07494163513183594, -0.07049942016601562, -0.06605720520019531, -0.061614990234375, -0.05717277526855469, -0.052730560302734375, -0.04828834533691406, -0.04384613037109375, -0.03940391540527344, -0.034961700439453125, -0.030519485473632812, -0.0260772705078125, -0.021635055541992188, -0.017192840576171875, -0.012750625610351562, -0.00830841064453125, -0.0038661956787109375, 0.000576019287109375, 0.0050182342529296875, 0.00946044921875, 0.013902664184570312, 0.018344879150390625, 0.022787094116210938, 0.02722930908203125, 0.03167152404785156, 0.036113739013671875, 0.04055595397949219, 0.0449981689453125, 0.04944038391113281, 0.053882598876953125, 0.05832481384277344, 0.06276702880859375, 0.06720924377441406, 0.07165145874023438, 0.07609367370605469, 0.080535888671875, 0.08497810363769531, 0.08942031860351562, 0.09386253356933594, 0.09830474853515625, 0.10274696350097656, 0.10718917846679688, 0.11163139343261719, 0.1160736083984375, 0.12051582336425781, 0.12495803833007812, 0.12940025329589844, 0.13384246826171875, 0.13828468322753906, 0.14272689819335938, 0.1471691131591797, 0.151611328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 13.0, 18.0, 15.0, 24.0, 36.0, 53.0, 53.0, 95.0, 79.0, 92.0, 87.0, 91.0, 74.0, 62.0, 55.0, 51.0, 32.0, 18.0, 18.0, 11.0, 10.0, 9.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06890869140625, -0.06647777557373047, -0.06404685974121094, -0.061615943908691406, -0.059185028076171875, -0.056754112243652344, -0.05432319641113281, -0.05189228057861328, -0.04946136474609375, -0.04703044891357422, -0.04459953308105469, -0.042168617248535156, -0.039737701416015625, -0.037306785583496094, -0.03487586975097656, -0.03244495391845703, -0.0300140380859375, -0.02758312225341797, -0.025152206420898438, -0.022721290588378906, -0.020290374755859375, -0.017859458923339844, -0.015428543090820312, -0.012997627258300781, -0.01056671142578125, -0.008135795593261719, -0.0057048797607421875, -0.0032739639282226562, -0.000843048095703125, 0.0015878677368164062, 0.0040187835693359375, 0.006449699401855469, 0.008880615234375, 0.011311531066894531, 0.013742446899414062, 0.016173362731933594, 0.018604278564453125, 0.021035194396972656, 0.023466110229492188, 0.02589702606201172, 0.02832794189453125, 0.03075885772705078, 0.03318977355957031, 0.035620689392089844, 0.038051605224609375, 0.040482521057128906, 0.04291343688964844, 0.04534435272216797, 0.0477752685546875, 0.05020618438720703, 0.05263710021972656, 0.055068016052246094, 0.057498931884765625, 0.059929847717285156, 0.06236076354980469, 0.06479167938232422, 0.06722259521484375, 0.06965351104736328, 0.07208442687988281, 0.07451534271240234, 0.07694625854492188, 0.0793771743774414, 0.08180809020996094, 0.08423900604248047, 0.086669921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 8.0, 6.0, 10.0, 9.0, 11.0, 22.0, 27.0, 23.0, 34.0, 39.0, 65.0, 92.0, 179.0, 347.0, 860.0, 2263.0, 6716.0, 20770.0, 71646.0, 268631.0, 453275.0, 159592.0, 43537.0, 13206.0, 4327.0, 1528.0, 581.0, 275.0, 113.0, 82.0, 63.0, 41.0, 32.0, 28.0, 24.0, 18.0, 18.0, 11.0, 7.0, 9.0, 6.0, 5.0, 1.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.14990234375, -0.1454010009765625, -0.140899658203125, -0.1363983154296875, -0.13189697265625, -0.1273956298828125, -0.122894287109375, -0.1183929443359375, -0.1138916015625, -0.1093902587890625, -0.104888916015625, -0.1003875732421875, -0.09588623046875, -0.0913848876953125, -0.086883544921875, -0.0823822021484375, -0.077880859375, -0.0733795166015625, -0.068878173828125, -0.0643768310546875, -0.05987548828125, -0.0553741455078125, -0.050872802734375, -0.0463714599609375, -0.0418701171875, -0.0373687744140625, -0.032867431640625, -0.0283660888671875, -0.02386474609375, -0.0193634033203125, -0.014862060546875, -0.0103607177734375, -0.005859375, -0.0013580322265625, 0.003143310546875, 0.0076446533203125, 0.01214599609375, 0.0166473388671875, 0.021148681640625, 0.0256500244140625, 0.0301513671875, 0.0346527099609375, 0.039154052734375, 0.0436553955078125, 0.04815673828125, 0.0526580810546875, 0.057159423828125, 0.0616607666015625, 0.066162109375, 0.0706634521484375, 0.075164794921875, 0.0796661376953125, 0.08416748046875, 0.0886688232421875, 0.093170166015625, 0.0976715087890625, 0.1021728515625, 0.1066741943359375, 0.111175537109375, 0.1156768798828125, 0.12017822265625, 0.1246795654296875, 0.129180908203125, 0.1336822509765625, 0.13818359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 3.0, 11.0, 10.0, 13.0, 14.0, 18.0, 24.0, 23.0, 21.0, 17.0, 27.0, 22.0, 27.0, 26.0, 26.0, 26.0, 36.0, 37.0, 28.0, 35.0, 44.0, 44.0, 35.0, 36.0, 35.0, 34.0, 30.0, 31.0, 24.0, 17.0, 23.0, 34.0, 19.0, 17.0, 23.0, 18.0, 16.0, 9.0, 10.0, 11.0, 6.0, 9.0, 8.0, 4.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.08612060546875, -0.08334541320800781, -0.08057022094726562, -0.07779502868652344, -0.07501983642578125, -0.07224464416503906, -0.06946945190429688, -0.06669425964355469, -0.0639190673828125, -0.06114387512207031, -0.058368682861328125, -0.05559349060058594, -0.05281829833984375, -0.05004310607910156, -0.047267913818359375, -0.04449272155761719, -0.041717529296875, -0.03894233703613281, -0.036167144775390625, -0.03339195251464844, -0.03061676025390625, -0.027841567993164062, -0.025066375732421875, -0.022291183471679688, -0.0195159912109375, -0.016740798950195312, -0.013965606689453125, -0.011190414428710938, -0.00841522216796875, -0.0056400299072265625, -0.002864837646484375, -8.96453857421875e-05, 0.002685546875, 0.0054607391357421875, 0.008235931396484375, 0.011011123657226562, 0.01378631591796875, 0.016561508178710938, 0.019336700439453125, 0.022111892700195312, 0.0248870849609375, 0.027662277221679688, 0.030437469482421875, 0.03321266174316406, 0.03598785400390625, 0.03876304626464844, 0.041538238525390625, 0.04431343078613281, 0.047088623046875, 0.04986381530761719, 0.052639007568359375, 0.05541419982910156, 0.05818939208984375, 0.06096458435058594, 0.06373977661132812, 0.06651496887207031, 0.0692901611328125, 0.07206535339355469, 0.07484054565429688, 0.07761573791503906, 0.08039093017578125, 0.08316612243652344, 0.08594131469726562, 0.08871650695800781, 0.09149169921875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 10.0, 17.0, 18.0, 36.0, 62.0, 104.0, 192.0, 355.0, 729.0, 1872.0, 5416.0, 20984.0, 105569.0, 445471.0, 367821.0, 76660.0, 15931.0, 4288.0, 1611.0, 662.0, 334.0, 172.0, 85.0, 62.0, 30.0, 18.0, 12.0, 7.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043487548828125, -0.04208040237426758, -0.040673255920410156, -0.039266109466552734, -0.03785896301269531, -0.03645181655883789, -0.03504467010498047, -0.03363752365112305, -0.032230377197265625, -0.030823230743408203, -0.02941608428955078, -0.02800893783569336, -0.026601791381835938, -0.025194644927978516, -0.023787498474121094, -0.022380352020263672, -0.02097320556640625, -0.019566059112548828, -0.018158912658691406, -0.016751766204833984, -0.015344619750976562, -0.01393747329711914, -0.012530326843261719, -0.011123180389404297, -0.009716033935546875, -0.008308887481689453, -0.006901741027832031, -0.005494594573974609, -0.0040874481201171875, -0.0026803016662597656, -0.0012731552124023438, 0.00013399124145507812, 0.0015411376953125, 0.002948284149169922, 0.004355430603027344, 0.005762577056884766, 0.0071697235107421875, 0.00857686996459961, 0.009984016418457031, 0.011391162872314453, 0.012798309326171875, 0.014205455780029297, 0.015612602233886719, 0.01701974868774414, 0.018426895141601562, 0.019834041595458984, 0.021241188049316406, 0.022648334503173828, 0.02405548095703125, 0.025462627410888672, 0.026869773864746094, 0.028276920318603516, 0.029684066772460938, 0.03109121322631836, 0.03249835968017578, 0.0339055061340332, 0.035312652587890625, 0.03671979904174805, 0.03812694549560547, 0.03953409194946289, 0.04094123840332031, 0.042348384857177734, 0.043755531311035156, 0.04516267776489258, 0.04656982421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 13.0, 9.0, 18.0, 18.0, 22.0, 15.0, 35.0, 33.0, 46.0, 30.0, 50.0, 59.0, 89.0, 59.0, 75.0, 56.0, 54.0, 60.0, 52.0, 40.0, 28.0, 25.0, 18.0, 21.0, 12.0, 12.0, 8.0, 12.0, 4.0, 6.0, 2.0, 3.0, 0.0, 5.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.198883056640625e-06, -5.950219929218292e-06, -5.7015568017959595e-06, -5.452893674373627e-06, -5.204230546951294e-06, -4.955567419528961e-06, -4.706904292106628e-06, -4.458241164684296e-06, -4.209578037261963e-06, -3.96091490983963e-06, -3.7122517824172974e-06, -3.4635886549949646e-06, -3.214925527572632e-06, -2.966262400150299e-06, -2.7175992727279663e-06, -2.4689361453056335e-06, -2.2202730178833008e-06, -1.971609890460968e-06, -1.7229467630386353e-06, -1.4742836356163025e-06, -1.2256205081939697e-06, -9.76957380771637e-07, -7.282942533493042e-07, -4.796311259269714e-07, -2.3096799850463867e-07, 1.7695128917694092e-08, 2.6635825634002686e-07, 5.150213837623596e-07, 7.636845111846924e-07, 1.0123476386070251e-06, 1.261010766029358e-06, 1.5096738934516907e-06, 1.7583370208740234e-06, 2.007000148296356e-06, 2.255663275718689e-06, 2.5043264031410217e-06, 2.7529895305633545e-06, 3.0016526579856873e-06, 3.25031578540802e-06, 3.4989789128303528e-06, 3.7476420402526855e-06, 3.996305167675018e-06, 4.244968295097351e-06, 4.493631422519684e-06, 4.742294549942017e-06, 4.990957677364349e-06, 5.239620804786682e-06, 5.488283932209015e-06, 5.736947059631348e-06, 5.98561018705368e-06, 6.234273314476013e-06, 6.482936441898346e-06, 6.731599569320679e-06, 6.9802626967430115e-06, 7.228925824165344e-06, 7.477588951587677e-06, 7.72625207901001e-06, 7.974915206432343e-06, 8.223578333854675e-06, 8.472241461277008e-06, 8.72090458869934e-06, 8.969567716121674e-06, 9.218230843544006e-06, 9.466893970966339e-06, 9.715557098388672e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 13.0, 33.0, 43.0, 106.0, 255.0, 664.0, 2370.0, 13554.0, 141916.0, 719647.0, 152160.0, 14155.0, 2511.0, 648.0, 237.0, 120.0, 56.0, 32.0, 8.0, 11.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06751728057861328, -0.06514930725097656, -0.06278133392333984, -0.060413360595703125, -0.058045387268066406, -0.05567741394042969, -0.05330944061279297, -0.05094146728515625, -0.04857349395751953, -0.04620552062988281, -0.043837547302246094, -0.041469573974609375, -0.039101600646972656, -0.03673362731933594, -0.03436565399169922, -0.0319976806640625, -0.02962970733642578, -0.027261734008789062, -0.024893760681152344, -0.022525787353515625, -0.020157814025878906, -0.017789840698242188, -0.015421867370605469, -0.01305389404296875, -0.010685920715332031, -0.008317947387695312, -0.005949974060058594, -0.003582000732421875, -0.0012140274047851562, 0.0011539459228515625, 0.0035219192504882812, 0.005889892578125, 0.008257865905761719, 0.010625839233398438, 0.012993812561035156, 0.015361785888671875, 0.017729759216308594, 0.020097732543945312, 0.02246570587158203, 0.02483367919921875, 0.02720165252685547, 0.029569625854492188, 0.031937599182128906, 0.034305572509765625, 0.036673545837402344, 0.03904151916503906, 0.04140949249267578, 0.0437774658203125, 0.04614543914794922, 0.04851341247558594, 0.050881385803222656, 0.053249359130859375, 0.055617332458496094, 0.05798530578613281, 0.06035327911376953, 0.06272125244140625, 0.06508922576904297, 0.06745719909667969, 0.0698251724243164, 0.07219314575195312, 0.07456111907958984, 0.07692909240722656, 0.07929706573486328, 0.0816650390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 9.0, 8.0, 9.0, 17.0, 19.0, 24.0, 33.0, 41.0, 44.0, 55.0, 74.0, 81.0, 92.0, 63.0, 67.0, 65.0, 58.0, 54.0, 47.0, 35.0, 21.0, 26.0, 17.0, 12.0, 5.0, 11.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03173828125, -0.03081345558166504, -0.029888629913330078, -0.028963804244995117, -0.028038978576660156, -0.027114152908325195, -0.026189327239990234, -0.025264501571655273, -0.024339675903320312, -0.02341485023498535, -0.02249002456665039, -0.02156519889831543, -0.02064037322998047, -0.019715547561645508, -0.018790721893310547, -0.017865896224975586, -0.016941070556640625, -0.016016244888305664, -0.015091419219970703, -0.014166593551635742, -0.013241767883300781, -0.01231694221496582, -0.01139211654663086, -0.010467290878295898, -0.009542465209960938, -0.008617639541625977, -0.007692813873291016, -0.006767988204956055, -0.005843162536621094, -0.004918336868286133, -0.003993511199951172, -0.003068685531616211, -0.00214385986328125, -0.001219034194946289, -0.0002942085266113281, 0.0006306171417236328, 0.0015554428100585938, 0.0024802684783935547, 0.0034050941467285156, 0.0043299198150634766, 0.0052547454833984375, 0.0061795711517333984, 0.007104396820068359, 0.00802922248840332, 0.008954048156738281, 0.009878873825073242, 0.010803699493408203, 0.011728525161743164, 0.012653350830078125, 0.013578176498413086, 0.014503002166748047, 0.015427827835083008, 0.01635265350341797, 0.01727747917175293, 0.01820230484008789, 0.01912713050842285, 0.020051956176757812, 0.020976781845092773, 0.021901607513427734, 0.022826433181762695, 0.023751258850097656, 0.024676084518432617, 0.025600910186767578, 0.02652573585510254, 0.0274505615234375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 12.0, 23.0, 43.0, 99.0, 156.0, 200.0, 205.0, 110.0, 63.0, 29.0, 22.0, 15.0, 3.0, 3.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6291400194168091, -0.6105483174324036, -0.591956615447998, -0.5733648538589478, -0.5547731518745422, -0.5361814498901367, -0.5175897479057312, -0.4989980161190033, -0.4804062843322754, -0.4618145823478699, -0.44322285056114197, -0.42463114857673645, -0.40603941679000854, -0.387447714805603, -0.3688560128211975, -0.3502642810344696, -0.3316725790500641, -0.31308087706565857, -0.29448914527893066, -0.27589744329452515, -0.25730571150779724, -0.23871400952339172, -0.220122292637825, -0.2015305757522583, -0.1829388588666916, -0.16434714198112488, -0.14575542509555817, -0.12716370820999146, -0.10857199877500534, -0.08998028188943863, -0.07138857245445251, -0.0527968555688858, -0.03420513868331909, -0.01561342366039753, 0.0029782913625240326, 0.021570004522800446, 0.04016172140836716, 0.05875343829393387, 0.07734514772891998, 0.0959368646144867, 0.1145285815000534, 0.13312029838562012, 0.15171201527118683, 0.17030373215675354, 0.18889543414115906, 0.20748716592788696, 0.22607886791229248, 0.2446705847978592, 0.2632623016834259, 0.2818540036678314, 0.3004457354545593, 0.31903743743896484, 0.33762916922569275, 0.35622087121009827, 0.37481260299682617, 0.3934043049812317, 0.4119960069656372, 0.4305877089500427, 0.44917944073677063, 0.46777114272117615, 0.48636287450790405, 0.5049545764923096, 0.5235462784767151, 0.5421379804611206, 0.5607297420501709]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 5.0, 7.0, 10.0, 19.0, 14.0, 14.0, 22.0, 19.0, 27.0, 29.0, 24.0, 35.0, 41.0, 46.0, 39.0, 40.0, 39.0, 49.0, 37.0, 29.0, 45.0, 40.0, 32.0, 29.0, 27.0, 44.0, 41.0, 27.0, 19.0, 17.0, 26.0, 16.0, 16.0, 15.0, 16.0, 5.0, 8.0, 10.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.3699676990509033, -0.3599499464035034, -0.3499321937561035, -0.3399144411087036, -0.3298966884613037, -0.3198789358139038, -0.3098611831665039, -0.2998434007167816, -0.2898256480693817, -0.2798078954219818, -0.2697901427745819, -0.259772390127182, -0.2497546225786209, -0.239736869931221, -0.2297191172838211, -0.21970134973526, -0.2096836119890213, -0.1996658593416214, -0.1896481066942215, -0.1796303391456604, -0.1696125864982605, -0.1595948338508606, -0.1495770812034607, -0.1395593285560608, -0.1295415759086609, -0.11952382326126099, -0.10950606316328049, -0.09948831051588058, -0.08947055041790009, -0.07945279777050018, -0.06943504512310028, -0.05941728502511978, -0.04939952492713928, -0.03938176855444908, -0.02936401404440403, -0.01934625953435898, -0.009328503161668777, 0.0006892532110214233, 0.010707005858421326, 0.020724765956401825, 0.030742518603801727, 0.04076027497649193, 0.05077803134918213, 0.06079578399658203, 0.07081353664398193, 0.08083129674196243, 0.09084904938936234, 0.10086680948734283, 0.11088456213474274, 0.12090231478214264, 0.13092006742954254, 0.14093783497810364, 0.15095558762550354, 0.16097334027290344, 0.17099109292030334, 0.18100884556770325, 0.19102659821510315, 0.20104435086250305, 0.21106210350990295, 0.22107985615730286, 0.23109762370586395, 0.24111537635326385, 0.25113314390182495, 0.26115089654922485, 0.27116864919662476]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 6.0, 7.0, 11.0, 12.0, 26.0, 29.0, 47.0, 64.0, 99.0, 194.0, 332.0, 644.0, 1274.0, 2867.0, 7058.0, 20253.0, 72226.0, 537119.0, 2808339.0, 632454.0, 77919.0, 20838.0, 6876.0, 2796.0, 1281.0, 661.0, 333.0, 176.0, 122.0, 70.0, 42.0, 46.0, 22.0, 13.0, 6.0, 12.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10928916931152344, -0.10602951049804688, -0.10276985168457031, -0.09951019287109375, -0.09625053405761719, -0.09299087524414062, -0.08973121643066406, -0.0864715576171875, -0.08321189880371094, -0.07995223999023438, -0.07669258117675781, -0.07343292236328125, -0.07017326354980469, -0.06691360473632812, -0.06365394592285156, -0.060394287109375, -0.05713462829589844, -0.053874969482421875, -0.05061531066894531, -0.04735565185546875, -0.04409599304199219, -0.040836334228515625, -0.03757667541503906, -0.0343170166015625, -0.031057357788085938, -0.027797698974609375, -0.024538040161132812, -0.02127838134765625, -0.018018722534179688, -0.014759063720703125, -0.011499404907226562, -0.00823974609375, -0.0049800872802734375, -0.001720428466796875, 0.0015392303466796875, 0.00479888916015625, 0.008058547973632812, 0.011318206787109375, 0.014577865600585938, 0.0178375244140625, 0.021097183227539062, 0.024356842041015625, 0.027616500854492188, 0.03087615966796875, 0.03413581848144531, 0.037395477294921875, 0.04065513610839844, 0.043914794921875, 0.04717445373535156, 0.050434112548828125, 0.05369377136230469, 0.05695343017578125, 0.06021308898925781, 0.06347274780273438, 0.06673240661621094, 0.0699920654296875, 0.07325172424316406, 0.07651138305664062, 0.07977104187011719, 0.08303070068359375, 0.08629035949707031, 0.08955001831054688, 0.09280967712402344, 0.0960693359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 17.0, 19.0, 27.0, 24.0, 33.0, 50.0, 54.0, 60.0, 75.0, 74.0, 98.0, 65.0, 71.0, 64.0, 53.0, 65.0, 42.0, 34.0, 20.0, 20.0, 12.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0814208984375, -0.07899761199951172, -0.07657432556152344, -0.07415103912353516, -0.07172775268554688, -0.0693044662475586, -0.06688117980957031, -0.06445789337158203, -0.06203460693359375, -0.05961132049560547, -0.05718803405761719, -0.054764747619628906, -0.052341461181640625, -0.049918174743652344, -0.04749488830566406, -0.04507160186767578, -0.0426483154296875, -0.04022502899169922, -0.03780174255371094, -0.035378456115722656, -0.032955169677734375, -0.030531883239746094, -0.028108596801757812, -0.02568531036376953, -0.02326202392578125, -0.02083873748779297, -0.018415451049804688, -0.015992164611816406, -0.013568878173828125, -0.011145591735839844, -0.008722305297851562, -0.006299018859863281, -0.003875732421875, -0.0014524459838867188, 0.0009708404541015625, 0.0033941268920898438, 0.005817413330078125, 0.008240699768066406, 0.010663986206054688, 0.013087272644042969, 0.01551055908203125, 0.01793384552001953, 0.020357131958007812, 0.022780418395996094, 0.025203704833984375, 0.027626991271972656, 0.030050277709960938, 0.03247356414794922, 0.0348968505859375, 0.03732013702392578, 0.03974342346191406, 0.042166709899902344, 0.044589996337890625, 0.047013282775878906, 0.04943656921386719, 0.05185985565185547, 0.05428314208984375, 0.05670642852783203, 0.05912971496582031, 0.061553001403808594, 0.06397628784179688, 0.06639957427978516, 0.06882286071777344, 0.07124614715576172, 0.07366943359375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 6.0, 13.0, 24.0, 26.0, 48.0, 80.0, 176.0, 400.0, 1283.0, 12747.0, 2297764.0, 1868085.0, 11638.0, 1238.0, 369.0, 154.0, 83.0, 45.0, 28.0, 22.0, 14.0, 10.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4367942810058594, -0.42559051513671875, -0.4143867492675781, -0.4031829833984375, -0.3919792175292969, -0.38077545166015625, -0.3695716857910156, -0.358367919921875, -0.3471641540527344, -0.33596038818359375, -0.3247566223144531, -0.3135528564453125, -0.3023490905761719, -0.29114532470703125, -0.2799415588378906, -0.26873779296875, -0.2575340270996094, -0.24633026123046875, -0.23512649536132812, -0.2239227294921875, -0.21271896362304688, -0.20151519775390625, -0.19031143188476562, -0.179107666015625, -0.16790390014648438, -0.15670013427734375, -0.14549636840820312, -0.1342926025390625, -0.12308883666992188, -0.11188507080078125, -0.10068130493164062, -0.0894775390625, -0.07827377319335938, -0.06707000732421875, -0.055866241455078125, -0.0446624755859375, -0.033458709716796875, -0.02225494384765625, -0.011051177978515625, 0.000152587890625, 0.011356353759765625, 0.02256011962890625, 0.033763885498046875, 0.0449676513671875, 0.056171417236328125, 0.06737518310546875, 0.07857894897460938, 0.08978271484375, 0.10098648071289062, 0.11219024658203125, 0.12339401245117188, 0.1345977783203125, 0.14580154418945312, 0.15700531005859375, 0.16820907592773438, 0.179412841796875, 0.19061660766601562, 0.20182037353515625, 0.21302413940429688, 0.2242279052734375, 0.23543167114257812, 0.24663543701171875, 0.2578392028808594, 0.26904296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 4.0, 4.0, 6.0, 19.0, 20.0, 22.0, 33.0, 54.0, 85.0, 153.0, 233.0, 462.0, 946.0, 929.0, 482.0, 254.0, 126.0, 71.0, 49.0, 42.0, 36.0, 13.0, 13.0, 6.0, 5.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09722900390625, -0.09317493438720703, -0.08912086486816406, -0.0850667953491211, -0.08101272583007812, -0.07695865631103516, -0.07290458679199219, -0.06885051727294922, -0.06479644775390625, -0.06074237823486328, -0.05668830871582031, -0.052634239196777344, -0.048580169677734375, -0.044526100158691406, -0.04047203063964844, -0.03641796112060547, -0.0323638916015625, -0.02830982208251953, -0.024255752563476562, -0.020201683044433594, -0.016147613525390625, -0.012093544006347656, -0.008039474487304688, -0.003985404968261719, 6.866455078125e-05, 0.004122734069824219, 0.008176803588867188, 0.012230873107910156, 0.016284942626953125, 0.020339012145996094, 0.024393081665039062, 0.02844715118408203, 0.032501220703125, 0.03655529022216797, 0.04060935974121094, 0.044663429260253906, 0.048717498779296875, 0.052771568298339844, 0.05682563781738281, 0.06087970733642578, 0.06493377685546875, 0.06898784637451172, 0.07304191589355469, 0.07709598541259766, 0.08115005493164062, 0.0852041244506836, 0.08925819396972656, 0.09331226348876953, 0.0973663330078125, 0.10142040252685547, 0.10547447204589844, 0.1095285415649414, 0.11358261108398438, 0.11763668060302734, 0.12169075012207031, 0.12574481964111328, 0.12979888916015625, 0.13385295867919922, 0.1379070281982422, 0.14196109771728516, 0.14601516723632812, 0.1500692367553711, 0.15412330627441406, 0.15817737579345703, 0.1622314453125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 13.0, 30.0, 66.0, 192.0, 252.0, 245.0, 111.0, 57.0, 16.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8142618536949158, -0.7869841456413269, -0.759706437587738, -0.732428789138794, -0.7051510810852051, -0.6778733730316162, -0.6505956649780273, -0.6233179569244385, -0.5960402488708496, -0.5687625408172607, -0.5414848327636719, -0.514207124710083, -0.4869294762611389, -0.45965176820755005, -0.4323740601539612, -0.4050963521003723, -0.3778187036514282, -0.35054099559783936, -0.3232633173465729, -0.295985609292984, -0.26870793104171753, -0.24143022298812866, -0.2141525149345398, -0.18687482178211212, -0.15959712862968445, -0.13231943547725677, -0.1050417348742485, -0.07776403427124023, -0.05048634111881256, -0.023208647966384888, 0.0040690600872039795, 0.03134675323963165, 0.05862438678741455, 0.08590207993984222, 0.1131797805428505, 0.14045748114585876, 0.16773517429828644, 0.1950128674507141, 0.22229057550430298, 0.24956826865673065, 0.2768459618091583, 0.3041236698627472, 0.33140134811401367, 0.35867905616760254, 0.3859567642211914, 0.4132344424724579, 0.44051215052604675, 0.46778982877731323, 0.4950675368309021, 0.522345244884491, 0.5496229529380798, 0.5769006013870239, 0.6041783094406128, 0.6314560174942017, 0.6587337255477905, 0.6860114336013794, 0.7132891416549683, 0.7405668497085571, 0.767844557762146, 0.7951222658157349, 0.822399914264679, 0.8496776223182678, 0.8769553303718567, 0.9042330384254456, 0.9315106868743896]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 6.0, 4.0, 8.0, 15.0, 9.0, 10.0, 18.0, 18.0, 27.0, 26.0, 30.0, 36.0, 38.0, 40.0, 39.0, 43.0, 48.0, 36.0, 37.0, 54.0, 49.0, 39.0, 48.0, 32.0, 36.0, 35.0, 35.0, 28.0, 18.0, 21.0, 10.0, 20.0, 9.0, 17.0, 11.0, 12.0, 2.0, 13.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2595297694206238, -0.2514130175113678, -0.24329626560211182, -0.23517951369285583, -0.22706276178359985, -0.21894600987434387, -0.2108292579650879, -0.2027125060558319, -0.19459575414657593, -0.18647900223731995, -0.17836225032806396, -0.17024549841880798, -0.162128746509552, -0.15401199460029602, -0.14589524269104004, -0.13777849078178406, -0.12966173887252808, -0.1215449869632721, -0.11342823505401611, -0.10531148314476013, -0.09719473123550415, -0.08907797932624817, -0.08096122741699219, -0.0728444755077362, -0.06472772359848022, -0.05661097168922424, -0.04849421977996826, -0.04037746787071228, -0.0322607159614563, -0.024143964052200317, -0.016027212142944336, -0.007910460233688354, 0.00020629167556762695, 0.008323043584823608, 0.01643979549407959, 0.02455654740333557, 0.03267329931259155, 0.040790051221847534, 0.048906803131103516, 0.0570235550403595, 0.06514030694961548, 0.07325705885887146, 0.08137381076812744, 0.08949056267738342, 0.0976073145866394, 0.10572406649589539, 0.11384081840515137, 0.12195757031440735, 0.13007432222366333, 0.1381910741329193, 0.1463078260421753, 0.15442457795143127, 0.16254132986068726, 0.17065808176994324, 0.17877483367919922, 0.1868915855884552, 0.19500833749771118, 0.20312508940696716, 0.21124184131622314, 0.21935859322547913, 0.2274753451347351, 0.2355920970439911, 0.24370884895324707, 0.25182560086250305, 0.25994235277175903]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 5.0, 8.0, 8.0, 13.0, 33.0, 31.0, 40.0, 61.0, 61.0, 122.0, 167.0, 275.0, 423.0, 757.0, 1474.0, 3048.0, 7491.0, 19823.0, 59489.0, 186408.0, 382731.0, 254793.0, 85424.0, 27707.0, 9860.0, 3979.0, 1903.0, 948.0, 530.0, 317.0, 182.0, 138.0, 85.0, 63.0, 41.0, 27.0, 28.0, 18.0, 10.0, 13.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1519775390625, -0.1473236083984375, -0.142669677734375, -0.1380157470703125, -0.13336181640625, -0.1287078857421875, -0.124053955078125, -0.1194000244140625, -0.11474609375, -0.1100921630859375, -0.105438232421875, -0.1007843017578125, -0.09613037109375, -0.0914764404296875, -0.086822509765625, -0.0821685791015625, -0.0775146484375, -0.0728607177734375, -0.068206787109375, -0.0635528564453125, -0.05889892578125, -0.0542449951171875, -0.049591064453125, -0.0449371337890625, -0.040283203125, -0.0356292724609375, -0.030975341796875, -0.0263214111328125, -0.02166748046875, -0.0170135498046875, -0.012359619140625, -0.0077056884765625, -0.0030517578125, 0.0016021728515625, 0.006256103515625, 0.0109100341796875, 0.01556396484375, 0.0202178955078125, 0.024871826171875, 0.0295257568359375, 0.0341796875, 0.0388336181640625, 0.043487548828125, 0.0481414794921875, 0.05279541015625, 0.0574493408203125, 0.062103271484375, 0.0667572021484375, 0.0714111328125, 0.0760650634765625, 0.080718994140625, 0.0853729248046875, 0.09002685546875, 0.0946807861328125, 0.099334716796875, 0.1039886474609375, 0.108642578125, 0.1132965087890625, 0.117950439453125, 0.1226043701171875, 0.12725830078125, 0.1319122314453125, 0.136566162109375, 0.1412200927734375, 0.1458740234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 11.0, 21.0, 34.0, 39.0, 67.0, 73.0, 76.0, 84.0, 106.0, 77.0, 80.0, 88.0, 56.0, 56.0, 43.0, 27.0, 22.0, 9.0, 11.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0828857421875, -0.08035755157470703, -0.07782936096191406, -0.0753011703491211, -0.07277297973632812, -0.07024478912353516, -0.06771659851074219, -0.06518840789794922, -0.06266021728515625, -0.06013202667236328, -0.05760383605957031, -0.055075645446777344, -0.052547454833984375, -0.050019264221191406, -0.04749107360839844, -0.04496288299560547, -0.0424346923828125, -0.03990650177001953, -0.03737831115722656, -0.034850120544433594, -0.032321929931640625, -0.029793739318847656, -0.027265548706054688, -0.02473735809326172, -0.02220916748046875, -0.01968097686767578, -0.017152786254882812, -0.014624595642089844, -0.012096405029296875, -0.009568214416503906, -0.0070400238037109375, -0.004511833190917969, -0.001983642578125, 0.0005445480346679688, 0.0030727386474609375, 0.005600929260253906, 0.008129119873046875, 0.010657310485839844, 0.013185501098632812, 0.01571369171142578, 0.01824188232421875, 0.02077007293701172, 0.023298263549804688, 0.025826454162597656, 0.028354644775390625, 0.030882835388183594, 0.03341102600097656, 0.03593921661376953, 0.0384674072265625, 0.04099559783935547, 0.04352378845214844, 0.046051979064941406, 0.048580169677734375, 0.051108360290527344, 0.05363655090332031, 0.05616474151611328, 0.05869293212890625, 0.06122112274169922, 0.06374931335449219, 0.06627750396728516, 0.06880569458007812, 0.0713338851928711, 0.07386207580566406, 0.07639026641845703, 0.07891845703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 17.0, 21.0, 22.0, 30.0, 35.0, 45.0, 70.0, 92.0, 137.0, 174.0, 263.0, 444.0, 718.0, 1549.0, 3427.0, 8882.0, 29018.0, 112251.0, 389305.0, 361511.0, 99805.0, 25988.0, 8151.0, 3126.0, 1406.0, 734.0, 399.0, 248.0, 187.0, 133.0, 92.0, 59.0, 58.0, 34.0, 26.0, 15.0, 11.0, 13.0, 10.0, 9.0, 10.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1248779296875, -0.12056541442871094, -0.11625289916992188, -0.11194038391113281, -0.10762786865234375, -0.10331535339355469, -0.09900283813476562, -0.09469032287597656, -0.0903778076171875, -0.08606529235839844, -0.08175277709960938, -0.07744026184082031, -0.07312774658203125, -0.06881523132324219, -0.06450271606445312, -0.06019020080566406, -0.055877685546875, -0.05156517028808594, -0.047252655029296875, -0.04294013977050781, -0.03862762451171875, -0.03431510925292969, -0.030002593994140625, -0.025690078735351562, -0.0213775634765625, -0.017065048217773438, -0.012752532958984375, -0.008440017700195312, -0.00412750244140625, 0.0001850128173828125, 0.004497528076171875, 0.008810043334960938, 0.01312255859375, 0.017435073852539062, 0.021747589111328125, 0.026060104370117188, 0.03037261962890625, 0.03468513488769531, 0.038997650146484375, 0.04331016540527344, 0.0476226806640625, 0.05193519592285156, 0.056247711181640625, 0.06056022644042969, 0.06487274169921875, 0.06918525695800781, 0.07349777221679688, 0.07781028747558594, 0.082122802734375, 0.08643531799316406, 0.09074783325195312, 0.09506034851074219, 0.09937286376953125, 0.10368537902832031, 0.10799789428710938, 0.11231040954589844, 0.1166229248046875, 0.12093544006347656, 0.12524795532226562, 0.1295604705810547, 0.13387298583984375, 0.1381855010986328, 0.14249801635742188, 0.14681053161621094, 0.151123046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 1.0, 7.0, 11.0, 9.0, 11.0, 15.0, 21.0, 27.0, 22.0, 29.0, 31.0, 32.0, 36.0, 38.0, 48.0, 29.0, 36.0, 42.0, 48.0, 37.0, 49.0, 39.0, 43.0, 47.0, 44.0, 27.0, 31.0, 26.0, 21.0, 26.0, 22.0, 16.0, 10.0, 13.0, 11.0, 10.0, 7.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.1112060546875, -0.10800838470458984, -0.10481071472167969, -0.10161304473876953, -0.09841537475585938, -0.09521770477294922, -0.09202003479003906, -0.0888223648071289, -0.08562469482421875, -0.0824270248413086, -0.07922935485839844, -0.07603168487548828, -0.07283401489257812, -0.06963634490966797, -0.06643867492675781, -0.06324100494384766, -0.0600433349609375, -0.056845664978027344, -0.05364799499511719, -0.05045032501220703, -0.047252655029296875, -0.04405498504638672, -0.04085731506347656, -0.037659645080566406, -0.03446197509765625, -0.031264305114746094, -0.028066635131835938, -0.02486896514892578, -0.021671295166015625, -0.01847362518310547, -0.015275955200195312, -0.012078285217285156, -0.008880615234375, -0.005682945251464844, -0.0024852752685546875, 0.0007123947143554688, 0.003910064697265625, 0.007107734680175781, 0.010305404663085938, 0.013503074645996094, 0.01670074462890625, 0.019898414611816406, 0.023096084594726562, 0.02629375457763672, 0.029491424560546875, 0.03268909454345703, 0.03588676452636719, 0.039084434509277344, 0.0422821044921875, 0.045479774475097656, 0.04867744445800781, 0.05187511444091797, 0.055072784423828125, 0.05827045440673828, 0.06146812438964844, 0.0646657943725586, 0.06786346435546875, 0.0710611343383789, 0.07425880432128906, 0.07745647430419922, 0.08065414428710938, 0.08385181427001953, 0.08704948425292969, 0.09024715423583984, 0.09344482421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 3.0, 9.0, 13.0, 14.0, 28.0, 50.0, 67.0, 138.0, 350.0, 834.0, 1982.0, 8293.0, 228646.0, 784088.0, 19001.0, 3003.0, 1095.0, 478.0, 195.0, 84.0, 56.0, 36.0, 21.0, 15.0, 8.0, 17.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.13671875, -0.13233375549316406, -0.12794876098632812, -0.12356376647949219, -0.11917877197265625, -0.11479377746582031, -0.11040878295898438, -0.10602378845214844, -0.1016387939453125, -0.09725379943847656, -0.09286880493164062, -0.08848381042480469, -0.08409881591796875, -0.07971382141113281, -0.07532882690429688, -0.07094383239746094, -0.066558837890625, -0.06217384338378906, -0.057788848876953125, -0.05340385437011719, -0.04901885986328125, -0.04463386535644531, -0.040248870849609375, -0.03586387634277344, -0.0314788818359375, -0.027093887329101562, -0.022708892822265625, -0.018323898315429688, -0.01393890380859375, -0.009553909301757812, -0.005168914794921875, -0.0007839202880859375, 0.00360107421875, 0.007986068725585938, 0.012371063232421875, 0.016756057739257812, 0.02114105224609375, 0.025526046752929688, 0.029911041259765625, 0.03429603576660156, 0.0386810302734375, 0.04306602478027344, 0.047451019287109375, 0.05183601379394531, 0.05622100830078125, 0.06060600280761719, 0.06499099731445312, 0.06937599182128906, 0.073760986328125, 0.07814598083496094, 0.08253097534179688, 0.08691596984863281, 0.09130096435546875, 0.09568595886230469, 0.10007095336914062, 0.10445594787597656, 0.1088409423828125, 0.11322593688964844, 0.11761093139648438, 0.12199592590332031, 0.12638092041015625, 0.1307659149169922, 0.13515090942382812, 0.13953590393066406, 0.1439208984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 6.0, 12.0, 11.0, 18.0, 21.0, 44.0, 41.0, 81.0, 77.0, 112.0, 114.0, 102.0, 81.0, 84.0, 45.0, 35.0, 24.0, 17.0, 12.0, 17.0, 7.0, 10.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.704692840576172e-05, -1.65402889251709e-05, -1.6033649444580078e-05, -1.5527009963989258e-05, -1.5020370483398438e-05, -1.4513731002807617e-05, -1.4007091522216797e-05, -1.3500452041625977e-05, -1.2993812561035156e-05, -1.2487173080444336e-05, -1.1980533599853516e-05, -1.1473894119262695e-05, -1.0967254638671875e-05, -1.0460615158081055e-05, -9.953975677490234e-06, -9.447336196899414e-06, -8.940696716308594e-06, -8.434057235717773e-06, -7.927417755126953e-06, -7.420778274536133e-06, -6.9141387939453125e-06, -6.407499313354492e-06, -5.900859832763672e-06, -5.3942203521728516e-06, -4.887580871582031e-06, -4.380941390991211e-06, -3.874301910400391e-06, -3.3676624298095703e-06, -2.86102294921875e-06, -2.3543834686279297e-06, -1.8477439880371094e-06, -1.341104507446289e-06, -8.344650268554688e-07, -3.2782554626464844e-07, 1.7881393432617188e-07, 6.854534149169922e-07, 1.1920928955078125e-06, 1.6987323760986328e-06, 2.205371856689453e-06, 2.7120113372802734e-06, 3.2186508178710938e-06, 3.725290298461914e-06, 4.231929779052734e-06, 4.738569259643555e-06, 5.245208740234375e-06, 5.751848220825195e-06, 6.258487701416016e-06, 6.765127182006836e-06, 7.271766662597656e-06, 7.778406143188477e-06, 8.285045623779297e-06, 8.791685104370117e-06, 9.298324584960938e-06, 9.804964065551758e-06, 1.0311603546142578e-05, 1.0818243026733398e-05, 1.1324882507324219e-05, 1.1831521987915039e-05, 1.233816146850586e-05, 1.284480094909668e-05, 1.33514404296875e-05, 1.385807991027832e-05, 1.436471939086914e-05, 1.4871358871459961e-05, 1.537799835205078e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 4.0, 8.0, 8.0, 3.0, 13.0, 15.0, 19.0, 45.0, 63.0, 75.0, 87.0, 165.0, 211.0, 284.0, 410.0, 633.0, 858.0, 1283.0, 2009.0, 3337.0, 6600.0, 21371.0, 168037.0, 702475.0, 109183.0, 16825.0, 5704.0, 3051.0, 1872.0, 1160.0, 833.0, 593.0, 371.0, 307.0, 185.0, 122.0, 88.0, 69.0, 43.0, 43.0, 25.0, 16.0, 16.0, 13.0, 7.0, 8.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0738525390625, -0.0715017318725586, -0.06915092468261719, -0.06680011749267578, -0.06444931030273438, -0.06209850311279297, -0.05974769592285156, -0.057396888732910156, -0.05504608154296875, -0.052695274353027344, -0.05034446716308594, -0.04799365997314453, -0.045642852783203125, -0.04329204559326172, -0.04094123840332031, -0.038590431213378906, -0.0362396240234375, -0.033888816833496094, -0.03153800964355469, -0.02918720245361328, -0.026836395263671875, -0.02448558807373047, -0.022134780883789062, -0.019783973693847656, -0.01743316650390625, -0.015082359313964844, -0.012731552124023438, -0.010380744934082031, -0.008029937744140625, -0.005679130554199219, -0.0033283233642578125, -0.0009775161743164062, 0.001373291015625, 0.0037240982055664062, 0.0060749053955078125, 0.008425712585449219, 0.010776519775390625, 0.013127326965332031, 0.015478134155273438, 0.017828941345214844, 0.02017974853515625, 0.022530555725097656, 0.024881362915039062, 0.02723217010498047, 0.029582977294921875, 0.03193378448486328, 0.03428459167480469, 0.036635398864746094, 0.0389862060546875, 0.041337013244628906, 0.04368782043457031, 0.04603862762451172, 0.048389434814453125, 0.05074024200439453, 0.05309104919433594, 0.055441856384277344, 0.05779266357421875, 0.060143470764160156, 0.06249427795410156, 0.06484508514404297, 0.06719589233398438, 0.06954669952392578, 0.07189750671386719, 0.0742483139038086, 0.07659912109375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 8.0, 13.0, 19.0, 15.0, 27.0, 40.0, 68.0, 80.0, 126.0, 155.0, 125.0, 93.0, 64.0, 48.0, 33.0, 19.0, 11.0, 9.0, 11.0, 5.0, 2.0, 2.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.038604736328125, -0.03709220886230469, -0.035579681396484375, -0.03406715393066406, -0.03255462646484375, -0.031042098999023438, -0.029529571533203125, -0.028017044067382812, -0.0265045166015625, -0.024991989135742188, -0.023479461669921875, -0.021966934204101562, -0.02045440673828125, -0.018941879272460938, -0.017429351806640625, -0.015916824340820312, -0.014404296875, -0.012891769409179688, -0.011379241943359375, -0.009866714477539062, -0.00835418701171875, -0.0068416595458984375, -0.005329132080078125, -0.0038166046142578125, -0.0023040771484375, -0.0007915496826171875, 0.000720977783203125, 0.0022335052490234375, 0.00374603271484375, 0.0052585601806640625, 0.006771087646484375, 0.008283615112304688, 0.009796142578125, 0.011308670043945312, 0.012821197509765625, 0.014333724975585938, 0.01584625244140625, 0.017358779907226562, 0.018871307373046875, 0.020383834838867188, 0.0218963623046875, 0.023408889770507812, 0.024921417236328125, 0.026433944702148438, 0.02794647216796875, 0.029458999633789062, 0.030971527099609375, 0.03248405456542969, 0.03399658203125, 0.03550910949707031, 0.037021636962890625, 0.03853416442871094, 0.04004669189453125, 0.04155921936035156, 0.043071746826171875, 0.04458427429199219, 0.0460968017578125, 0.04760932922363281, 0.049121856689453125, 0.05063438415527344, 0.05214691162109375, 0.05365943908691406, 0.055171966552734375, 0.05668449401855469, 0.058197021484375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 9.0, 23.0, 87.0, 418.0, 336.0, 99.0, 24.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6984809041023254, -0.6479597091674805, -0.5974385738372803, -0.5469173789024353, -0.4963962435722351, -0.44587504863739014, -0.39535388350486755, -0.34483271837234497, -0.2943115532398224, -0.2437903881072998, -0.19326922297477722, -0.14274804294109344, -0.09222687780857086, -0.041705697774887085, 0.008815467357635498, 0.05933663249015808, 0.10985779762268066, 0.16037896275520325, 0.21090012788772583, 0.2614213228225708, 0.311942458152771, 0.36246365308761597, 0.41298481822013855, 0.46350598335266113, 0.5140271186828613, 0.5645483136177063, 0.6150694489479065, 0.6655906438827515, 0.7161117792129517, 0.7666329741477966, 0.8171541690826416, 0.8676753044128418, 0.9181965589523315, 0.9687177538871765, 1.0192389488220215, 1.0697600841522217, 1.1202812194824219, 1.170802354812622, 1.2213236093521118, 1.271844744682312, 1.3223658800125122, 1.3728870153427124, 1.4234082698822021, 1.4739294052124023, 1.5244505405426025, 1.5749716758728027, 1.6254929304122925, 1.6760140657424927, 1.7265353202819824, 1.7770564556121826, 1.8275777101516724, 1.8780988454818726, 1.9286199808120728, 1.9791412353515625, 2.0296623706817627, 2.080183506011963, 2.130704641342163, 2.1812257766723633, 2.2317469120025635, 2.2822680473327637, 2.332789421081543, 2.383310556411743, 2.4338316917419434, 2.4843528270721436, 2.5348739624023438]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 7.0, 5.0, 12.0, 22.0, 19.0, 14.0, 24.0, 33.0, 36.0, 39.0, 29.0, 35.0, 30.0, 46.0, 42.0, 49.0, 38.0, 45.0, 39.0, 48.0, 51.0, 37.0, 34.0, 29.0, 35.0, 22.0, 32.0, 29.0, 14.0, 12.0, 12.0, 14.0, 12.0, 7.0, 12.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3666459321975708, -0.3564077913761139, -0.346169650554657, -0.3359315097332001, -0.32569336891174316, -0.31545522809028625, -0.30521708726882935, -0.29497894644737244, -0.2847408056259155, -0.2745026648044586, -0.2642645239830017, -0.2540263831615448, -0.2437882423400879, -0.23355010151863098, -0.22331196069717407, -0.21307381987571716, -0.20283566415309906, -0.19259752333164215, -0.18235938251018524, -0.17212124168872833, -0.16188310086727142, -0.15164496004581451, -0.1414068043231964, -0.1311686635017395, -0.12093053013086319, -0.11069238930940628, -0.10045424848794937, -0.09021610021591187, -0.07997795939445496, -0.06973981857299805, -0.05950167775154114, -0.04926353693008423, -0.03902539610862732, -0.02878725528717041, -0.018549112603068352, -0.008310969918966293, 0.0019271709024906158, 0.012165311723947525, 0.022403456270694733, 0.03264159709215164, 0.04287973791360855, 0.05311787873506546, 0.06335601955652237, 0.07359416782855988, 0.08383230865001678, 0.0940704494714737, 0.1043085902929306, 0.11454673111438751, 0.12478487193584442, 0.13502301275730133, 0.14526115357875824, 0.15549929440021515, 0.16573743522167206, 0.17597557604312897, 0.18621373176574707, 0.19645187258720398, 0.2066900134086609, 0.2169281542301178, 0.2271662950515747, 0.23740443587303162, 0.24764257669448853, 0.25788071751594543, 0.26811885833740234, 0.27835699915885925, 0.28859513998031616]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 9.0, 5.0, 15.0, 17.0, 44.0, 56.0, 76.0, 144.0, 271.0, 473.0, 929.0, 1993.0, 4451.0, 12427.0, 40217.0, 208663.0, 2448463.0, 1323310.0, 112102.0, 26317.0, 8213.0, 3070.0, 1348.0, 676.0, 378.0, 214.0, 130.0, 73.0, 61.0, 42.0, 26.0, 17.0, 12.0, 10.0, 7.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08734130859375, -0.08382511138916016, -0.08030891418457031, -0.07679271697998047, -0.07327651977539062, -0.06976032257080078, -0.06624412536621094, -0.0627279281616211, -0.05921173095703125, -0.055695533752441406, -0.05217933654785156, -0.04866313934326172, -0.045146942138671875, -0.04163074493408203, -0.03811454772949219, -0.034598350524902344, -0.0310821533203125, -0.027565956115722656, -0.024049758911132812, -0.02053356170654297, -0.017017364501953125, -0.013501167297363281, -0.009984970092773438, -0.006468772888183594, -0.00295257568359375, 0.0005636215209960938, 0.0040798187255859375, 0.007596015930175781, 0.011112213134765625, 0.014628410339355469, 0.018144607543945312, 0.021660804748535156, 0.025177001953125, 0.028693199157714844, 0.03220939636230469, 0.03572559356689453, 0.039241790771484375, 0.04275798797607422, 0.04627418518066406, 0.049790382385253906, 0.05330657958984375, 0.056822776794433594, 0.06033897399902344, 0.06385517120361328, 0.06737136840820312, 0.07088756561279297, 0.07440376281738281, 0.07791996002197266, 0.0814361572265625, 0.08495235443115234, 0.08846855163574219, 0.09198474884033203, 0.09550094604492188, 0.09901714324951172, 0.10253334045410156, 0.1060495376586914, 0.10956573486328125, 0.1130819320678711, 0.11659812927246094, 0.12011432647705078, 0.12363052368164062, 0.12714672088623047, 0.1306629180908203, 0.13417911529541016, 0.1376953125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 14.0, 16.0, 26.0, 26.0, 40.0, 53.0, 63.0, 78.0, 81.0, 96.0, 83.0, 88.0, 75.0, 82.0, 52.0, 45.0, 28.0, 28.0, 7.0, 6.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08856201171875, -0.08579158782958984, -0.08302116394042969, -0.08025074005126953, -0.07748031616210938, -0.07470989227294922, -0.07193946838378906, -0.0691690444946289, -0.06639862060546875, -0.0636281967163086, -0.06085777282714844, -0.05808734893798828, -0.055316925048828125, -0.05254650115966797, -0.04977607727050781, -0.047005653381347656, -0.0442352294921875, -0.041464805603027344, -0.03869438171386719, -0.03592395782470703, -0.033153533935546875, -0.03038311004638672, -0.027612686157226562, -0.024842262268066406, -0.02207183837890625, -0.019301414489746094, -0.016530990600585938, -0.013760566711425781, -0.010990142822265625, -0.008219718933105469, -0.0054492950439453125, -0.0026788711547851562, 9.1552734375e-05, 0.0028619766235351562, 0.0056324005126953125, 0.008402824401855469, 0.011173248291015625, 0.013943672180175781, 0.016714096069335938, 0.019484519958496094, 0.02225494384765625, 0.025025367736816406, 0.027795791625976562, 0.03056621551513672, 0.033336639404296875, 0.03610706329345703, 0.03887748718261719, 0.041647911071777344, 0.0444183349609375, 0.047188758850097656, 0.04995918273925781, 0.05272960662841797, 0.055500030517578125, 0.05827045440673828, 0.06104087829589844, 0.0638113021850586, 0.06658172607421875, 0.0693521499633789, 0.07212257385253906, 0.07489299774169922, 0.07766342163085938, 0.08043384552001953, 0.08320426940917969, 0.08597469329833984, 0.0887451171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 9.0, 9.0, 13.0, 44.0, 47.0, 106.0, 218.0, 501.0, 1681.0, 19137.0, 3927851.0, 238655.0, 4443.0, 873.0, 346.0, 164.0, 95.0, 46.0, 21.0, 9.0, 9.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.268310546875, -0.2570152282714844, -0.24571990966796875, -0.23442459106445312, -0.2231292724609375, -0.21183395385742188, -0.20053863525390625, -0.18924331665039062, -0.177947998046875, -0.16665267944335938, -0.15535736083984375, -0.14406204223632812, -0.1327667236328125, -0.12147140502929688, -0.11017608642578125, -0.09888076782226562, -0.08758544921875, -0.07629013061523438, -0.06499481201171875, -0.053699493408203125, -0.0424041748046875, -0.031108856201171875, -0.01981353759765625, -0.008518218994140625, 0.002777099609375, 0.014072418212890625, 0.02536773681640625, 0.036663055419921875, 0.0479583740234375, 0.059253692626953125, 0.07054901123046875, 0.08184432983398438, 0.0931396484375, 0.10443496704101562, 0.11573028564453125, 0.12702560424804688, 0.1383209228515625, 0.14961624145507812, 0.16091156005859375, 0.17220687866210938, 0.183502197265625, 0.19479751586914062, 0.20609283447265625, 0.21738815307617188, 0.2286834716796875, 0.23997879028320312, 0.25127410888671875, 0.2625694274902344, 0.27386474609375, 0.2851600646972656, 0.29645538330078125, 0.3077507019042969, 0.3190460205078125, 0.3303413391113281, 0.34163665771484375, 0.3529319763183594, 0.364227294921875, 0.3755226135253906, 0.38681793212890625, 0.3981132507324219, 0.4094085693359375, 0.4207038879394531, 0.43199920654296875, 0.4432945251464844, 0.45458984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 11.0, 16.0, 17.0, 27.0, 38.0, 70.0, 66.0, 132.0, 186.0, 460.0, 819.0, 1026.0, 566.0, 212.0, 143.0, 73.0, 70.0, 37.0, 31.0, 17.0, 14.0, 9.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1121826171875, -0.10858154296875, -0.10498046875, -0.10137939453125, -0.0977783203125, -0.09417724609375, -0.090576171875, -0.08697509765625, -0.0833740234375, -0.07977294921875, -0.076171875, -0.07257080078125, -0.0689697265625, -0.06536865234375, -0.061767578125, -0.05816650390625, -0.0545654296875, -0.05096435546875, -0.04736328125, -0.04376220703125, -0.0401611328125, -0.03656005859375, -0.032958984375, -0.02935791015625, -0.0257568359375, -0.02215576171875, -0.0185546875, -0.01495361328125, -0.0113525390625, -0.00775146484375, -0.004150390625, -0.00054931640625, 0.0030517578125, 0.00665283203125, 0.01025390625, 0.01385498046875, 0.0174560546875, 0.02105712890625, 0.024658203125, 0.02825927734375, 0.0318603515625, 0.03546142578125, 0.0390625, 0.04266357421875, 0.0462646484375, 0.04986572265625, 0.053466796875, 0.05706787109375, 0.0606689453125, 0.06427001953125, 0.06787109375, 0.07147216796875, 0.0750732421875, 0.07867431640625, 0.082275390625, 0.08587646484375, 0.0894775390625, 0.09307861328125, 0.0966796875, 0.10028076171875, 0.1038818359375, 0.10748291015625, 0.111083984375, 0.11468505859375, 0.1182861328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 8.0, 9.0, 20.0, 52.0, 130.0, 204.0, 296.0, 180.0, 64.0, 26.0, 9.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9999528527259827, -0.9723597764968872, -0.9447667598724365, -0.9171736836433411, -0.8895806670188904, -0.8619875907897949, -0.8343945741653442, -0.8068014979362488, -0.7792084217071533, -0.7516153454780579, -0.7240223288536072, -0.6964292526245117, -0.668836236000061, -0.6412431597709656, -0.6136500835418701, -0.5860570669174194, -0.5584640502929688, -0.5308709740638733, -0.5032779574394226, -0.47568488121032715, -0.44809186458587646, -0.420498788356781, -0.39290574193000793, -0.36531269550323486, -0.3377196490764618, -0.3101266026496887, -0.28253355622291565, -0.2549405097961426, -0.2273474484682083, -0.19975440204143524, -0.17216134071350098, -0.1445682942867279, -0.11697518825531006, -0.08938214182853699, -0.06178908795118332, -0.03419603407382965, -0.00660298764705658, 0.02099005877971649, 0.04858312010765076, 0.07617616653442383, 0.1037692129611969, 0.13136225938796997, 0.15895530581474304, 0.1865483671426773, 0.21414141356945038, 0.24173445999622345, 0.2693275213241577, 0.2969205677509308, 0.32451361417770386, 0.35210666060447693, 0.37969970703125, 0.40729278326034546, 0.43488579988479614, 0.4624788761138916, 0.4900719225406647, 0.5176649689674377, 0.5452580451965332, 0.5728511214256287, 0.6004441380500793, 0.6280372142791748, 0.6556302309036255, 0.683223307132721, 0.7108163833618164, 0.7384093999862671, 0.7660024166107178]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 3.0, 1.0, 3.0, 6.0, 3.0, 7.0, 11.0, 6.0, 15.0, 10.0, 21.0, 20.0, 23.0, 17.0, 30.0, 28.0, 36.0, 31.0, 36.0, 41.0, 46.0, 41.0, 29.0, 34.0, 27.0, 42.0, 48.0, 47.0, 42.0, 32.0, 37.0, 32.0, 25.0, 25.0, 17.0, 24.0, 23.0, 17.0, 12.0, 14.0, 15.0, 13.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2007693648338318, -0.19360747933387756, -0.18644557893276215, -0.17928369343280792, -0.1721217930316925, -0.16495990753173828, -0.15779802203178406, -0.15063613653182983, -0.14347423613071442, -0.1363123506307602, -0.12915045022964478, -0.12198856472969055, -0.11482667177915573, -0.10766477882862091, -0.10050289332866669, -0.09334100037813187, -0.08617910742759705, -0.07901721447706223, -0.0718553215265274, -0.06469343602657318, -0.05753154307603836, -0.05036965012550354, -0.04320776090025902, -0.036045871675014496, -0.028883978724479675, -0.021722087636590004, -0.014560196548700333, -0.007398305460810661, -0.00023641437292099, 0.006925478577613831, 0.014087367802858353, 0.021249257028102875, 0.028411149978637695, 0.035573042929172516, 0.04273493215441704, 0.04989682137966156, 0.05705871433019638, 0.0642206072807312, 0.07138249278068542, 0.07854438573122025, 0.08570627868175507, 0.09286817163228989, 0.10003006458282471, 0.10719195008277893, 0.11435384303331375, 0.12151573598384857, 0.1286776214838028, 0.1358395218849182, 0.14300140738487244, 0.15016329288482666, 0.15732519328594208, 0.1644870787858963, 0.17164897918701172, 0.17881086468696594, 0.18597275018692017, 0.1931346356868744, 0.2002965360879898, 0.20745842158794403, 0.21462032198905945, 0.22178220748901367, 0.2289440929889679, 0.2361059933900833, 0.24326787889003754, 0.25042977929115295, 0.2575916647911072]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 17.0, 20.0, 21.0, 33.0, 37.0, 66.0, 103.0, 121.0, 198.0, 293.0, 484.0, 805.0, 1490.0, 3006.0, 6824.0, 17347.0, 48636.0, 141736.0, 347567.0, 302193.0, 113018.0, 38807.0, 14167.0, 5703.0, 2591.0, 1288.0, 716.0, 420.0, 256.0, 159.0, 103.0, 84.0, 53.0, 42.0, 37.0, 33.0, 22.0, 7.0, 9.0, 8.0, 4.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.11199951171875, -0.10869503021240234, -0.10539054870605469, -0.10208606719970703, -0.09878158569335938, -0.09547710418701172, -0.09217262268066406, -0.0888681411743164, -0.08556365966796875, -0.0822591781616211, -0.07895469665527344, -0.07565021514892578, -0.07234573364257812, -0.06904125213623047, -0.06573677062988281, -0.062432289123535156, -0.0591278076171875, -0.055823326110839844, -0.05251884460449219, -0.04921436309814453, -0.045909881591796875, -0.04260540008544922, -0.03930091857910156, -0.035996437072753906, -0.03269195556640625, -0.029387474060058594, -0.026082992553710938, -0.02277851104736328, -0.019474029541015625, -0.01616954803466797, -0.012865066528320312, -0.009560585021972656, -0.006256103515625, -0.0029516220092773438, 0.0003528594970703125, 0.0036573410034179688, 0.006961822509765625, 0.010266304016113281, 0.013570785522460938, 0.016875267028808594, 0.02017974853515625, 0.023484230041503906, 0.026788711547851562, 0.03009319305419922, 0.033397674560546875, 0.03670215606689453, 0.04000663757324219, 0.043311119079589844, 0.0466156005859375, 0.049920082092285156, 0.05322456359863281, 0.05652904510498047, 0.059833526611328125, 0.06313800811767578, 0.06644248962402344, 0.0697469711303711, 0.07305145263671875, 0.0763559341430664, 0.07966041564941406, 0.08296489715576172, 0.08626937866210938, 0.08957386016845703, 0.09287834167480469, 0.09618282318115234, 0.0994873046875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 16.0, 26.0, 37.0, 54.0, 56.0, 72.0, 86.0, 100.0, 113.0, 92.0, 97.0, 83.0, 51.0, 42.0, 24.0, 19.0, 13.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0968017578125, -0.09396648406982422, -0.09113121032714844, -0.08829593658447266, -0.08546066284179688, -0.0826253890991211, -0.07979011535644531, -0.07695484161376953, -0.07411956787109375, -0.07128429412841797, -0.06844902038574219, -0.0656137466430664, -0.06277847290039062, -0.059943199157714844, -0.05710792541503906, -0.05427265167236328, -0.0514373779296875, -0.04860210418701172, -0.04576683044433594, -0.042931556701660156, -0.040096282958984375, -0.037261009216308594, -0.03442573547363281, -0.03159046173095703, -0.02875518798828125, -0.02591991424560547, -0.023084640502929688, -0.020249366760253906, -0.017414093017578125, -0.014578819274902344, -0.011743545532226562, -0.008908271789550781, -0.006072998046875, -0.0032377243041992188, -0.0004024505615234375, 0.0024328231811523438, 0.005268096923828125, 0.008103370666503906, 0.010938644409179688, 0.013773918151855469, 0.01660919189453125, 0.01944446563720703, 0.022279739379882812, 0.025115013122558594, 0.027950286865234375, 0.030785560607910156, 0.03362083435058594, 0.03645610809326172, 0.0392913818359375, 0.04212665557861328, 0.04496192932128906, 0.047797203063964844, 0.050632476806640625, 0.053467750549316406, 0.05630302429199219, 0.05913829803466797, 0.06197357177734375, 0.06480884552001953, 0.06764411926269531, 0.0704793930053711, 0.07331466674804688, 0.07614994049072266, 0.07898521423339844, 0.08182048797607422, 0.08465576171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 3.0, 9.0, 10.0, 14.0, 16.0, 24.0, 21.0, 23.0, 34.0, 45.0, 76.0, 86.0, 138.0, 223.0, 305.0, 488.0, 891.0, 1903.0, 4685.0, 14265.0, 52625.0, 219117.0, 488778.0, 196109.0, 47154.0, 12906.0, 4389.0, 1681.0, 904.0, 497.0, 337.0, 204.0, 151.0, 109.0, 83.0, 66.0, 36.0, 28.0, 16.0, 26.0, 15.0, 13.0, 5.0, 7.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0], "bins": [-0.1142578125, -0.11073780059814453, -0.10721778869628906, -0.1036977767944336, -0.10017776489257812, -0.09665775299072266, -0.09313774108886719, -0.08961772918701172, -0.08609771728515625, -0.08257770538330078, -0.07905769348144531, -0.07553768157958984, -0.07201766967773438, -0.0684976577758789, -0.06497764587402344, -0.06145763397216797, -0.0579376220703125, -0.05441761016845703, -0.05089759826660156, -0.047377586364746094, -0.043857574462890625, -0.040337562561035156, -0.03681755065917969, -0.03329753875732422, -0.02977752685546875, -0.02625751495361328, -0.022737503051757812, -0.019217491149902344, -0.015697479248046875, -0.012177467346191406, -0.008657455444335938, -0.005137443542480469, -0.001617431640625, 0.0019025802612304688, 0.0054225921630859375, 0.008942604064941406, 0.012462615966796875, 0.015982627868652344, 0.019502639770507812, 0.02302265167236328, 0.02654266357421875, 0.03006267547607422, 0.03358268737792969, 0.037102699279785156, 0.040622711181640625, 0.044142723083496094, 0.04766273498535156, 0.05118274688720703, 0.0547027587890625, 0.05822277069091797, 0.06174278259277344, 0.0652627944946289, 0.06878280639648438, 0.07230281829833984, 0.07582283020019531, 0.07934284210205078, 0.08286285400390625, 0.08638286590576172, 0.08990287780761719, 0.09342288970947266, 0.09694290161132812, 0.1004629135131836, 0.10398292541503906, 0.10750293731689453, 0.11102294921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 3.0, 8.0, 8.0, 10.0, 11.0, 12.0, 20.0, 11.0, 28.0, 36.0, 37.0, 26.0, 38.0, 34.0, 40.0, 34.0, 50.0, 40.0, 49.0, 45.0, 45.0, 45.0, 39.0, 39.0, 44.0, 28.0, 20.0, 35.0, 25.0, 18.0, 23.0, 16.0, 17.0, 7.0, 10.0, 10.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.1102294921875, -0.10703182220458984, -0.10383415222167969, -0.10063648223876953, -0.09743881225585938, -0.09424114227294922, -0.09104347229003906, -0.0878458023071289, -0.08464813232421875, -0.0814504623413086, -0.07825279235839844, -0.07505512237548828, -0.07185745239257812, -0.06865978240966797, -0.06546211242675781, -0.062264442443847656, -0.0590667724609375, -0.055869102478027344, -0.05267143249511719, -0.04947376251220703, -0.046276092529296875, -0.04307842254638672, -0.03988075256347656, -0.036683082580566406, -0.03348541259765625, -0.030287742614746094, -0.027090072631835938, -0.02389240264892578, -0.020694732666015625, -0.01749706268310547, -0.014299392700195312, -0.011101722717285156, -0.007904052734375, -0.004706382751464844, -0.0015087127685546875, 0.0016889572143554688, 0.004886627197265625, 0.008084297180175781, 0.011281967163085938, 0.014479637145996094, 0.01767730712890625, 0.020874977111816406, 0.024072647094726562, 0.02727031707763672, 0.030467987060546875, 0.03366565704345703, 0.03686332702636719, 0.040060997009277344, 0.0432586669921875, 0.046456336975097656, 0.04965400695800781, 0.05285167694091797, 0.056049346923828125, 0.05924701690673828, 0.06244468688964844, 0.0656423568725586, 0.06884002685546875, 0.0720376968383789, 0.07523536682128906, 0.07843303680419922, 0.08163070678710938, 0.08482837677001953, 0.08802604675292969, 0.09122371673583984, 0.09442138671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 10.0, 16.0, 18.0, 23.0, 38.0, 85.0, 108.0, 231.0, 371.0, 678.0, 1218.0, 2523.0, 5370.0, 13942.0, 43310.0, 165735.0, 474296.0, 245864.0, 62196.0, 19023.0, 7066.0, 3098.0, 1502.0, 786.0, 404.0, 221.0, 163.0, 76.0, 58.0, 36.0, 16.0, 15.0, 12.0, 12.0, 6.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.031402587890625, -0.030440568923950195, -0.02947854995727539, -0.028516530990600586, -0.02755451202392578, -0.026592493057250977, -0.025630474090576172, -0.024668455123901367, -0.023706436157226562, -0.022744417190551758, -0.021782398223876953, -0.02082037925720215, -0.019858360290527344, -0.01889634132385254, -0.017934322357177734, -0.01697230339050293, -0.016010284423828125, -0.01504826545715332, -0.014086246490478516, -0.013124227523803711, -0.012162208557128906, -0.011200189590454102, -0.010238170623779297, -0.009276151657104492, -0.008314132690429688, -0.007352113723754883, -0.006390094757080078, -0.0054280757904052734, -0.004466056823730469, -0.003504037857055664, -0.0025420188903808594, -0.0015799999237060547, -0.00061798095703125, 0.0003440380096435547, 0.0013060569763183594, 0.002268075942993164, 0.0032300949096679688, 0.0041921138763427734, 0.005154132843017578, 0.006116151809692383, 0.0070781707763671875, 0.008040189743041992, 0.009002208709716797, 0.009964227676391602, 0.010926246643066406, 0.011888265609741211, 0.012850284576416016, 0.01381230354309082, 0.014774322509765625, 0.01573634147644043, 0.016698360443115234, 0.01766037940979004, 0.018622398376464844, 0.01958441734313965, 0.020546436309814453, 0.021508455276489258, 0.022470474243164062, 0.023432493209838867, 0.024394512176513672, 0.025356531143188477, 0.02631855010986328, 0.027280569076538086, 0.02824258804321289, 0.029204607009887695, 0.0301666259765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 11.0, 10.0, 14.0, 23.0, 37.0, 32.0, 46.0, 53.0, 39.0, 57.0, 73.0, 70.0, 68.0, 76.0, 64.0, 51.0, 48.0, 48.0, 30.0, 27.0, 22.0, 20.0, 9.0, 13.0, 5.0, 7.0, 6.0, 0.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -9.008683264255524e-06, -8.71904194355011e-06, -8.429400622844696e-06, -8.139759302139282e-06, -7.850117981433868e-06, -7.560476660728455e-06, -7.270835340023041e-06, -6.981194019317627e-06, -6.691552698612213e-06, -6.401911377906799e-06, -6.1122700572013855e-06, -5.822628736495972e-06, -5.532987415790558e-06, -5.243346095085144e-06, -4.95370477437973e-06, -4.664063453674316e-06, -4.374422132968903e-06, -4.084780812263489e-06, -3.795139491558075e-06, -3.505498170852661e-06, -3.2158568501472473e-06, -2.9262155294418335e-06, -2.6365742087364197e-06, -2.346932888031006e-06, -2.057291567325592e-06, -1.7676502466201782e-06, -1.4780089259147644e-06, -1.1883676052093506e-06, -8.987262845039368e-07, -6.09084963798523e-07, -3.1944364309310913e-07, -2.9802322387695312e-08, 2.598389983177185e-07, 5.494803190231323e-07, 8.391216397285461e-07, 1.12876296043396e-06, 1.4184042811393738e-06, 1.7080456018447876e-06, 1.9976869225502014e-06, 2.2873282432556152e-06, 2.576969563961029e-06, 2.866610884666443e-06, 3.1562522053718567e-06, 3.4458935260772705e-06, 3.7355348467826843e-06, 4.025176167488098e-06, 4.314817488193512e-06, 4.604458808898926e-06, 4.89410012960434e-06, 5.183741450309753e-06, 5.473382771015167e-06, 5.763024091720581e-06, 6.052665412425995e-06, 6.342306733131409e-06, 6.6319480538368225e-06, 6.921589374542236e-06, 7.21123069524765e-06, 7.500872015953064e-06, 7.790513336658478e-06, 8.080154657363892e-06, 8.369795978069305e-06, 8.65943729877472e-06, 8.949078619480133e-06, 9.238719940185547e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 17.0, 16.0, 36.0, 38.0, 61.0, 84.0, 123.0, 233.0, 388.0, 749.0, 1421.0, 2778.0, 5837.0, 14378.0, 43116.0, 188509.0, 533795.0, 187811.0, 42888.0, 14449.0, 5832.0, 2798.0, 1420.0, 745.0, 397.0, 231.0, 138.0, 94.0, 51.0, 37.0, 22.0, 22.0, 12.0, 5.0, 7.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032440185546875, -0.03126049041748047, -0.030080795288085938, -0.028901100158691406, -0.027721405029296875, -0.026541709899902344, -0.025362014770507812, -0.02418231964111328, -0.02300262451171875, -0.02182292938232422, -0.020643234252929688, -0.019463539123535156, -0.018283843994140625, -0.017104148864746094, -0.015924453735351562, -0.014744758605957031, -0.0135650634765625, -0.012385368347167969, -0.011205673217773438, -0.010025978088378906, -0.008846282958984375, -0.007666587829589844, -0.0064868927001953125, -0.005307197570800781, -0.00412750244140625, -0.0029478073120117188, -0.0017681121826171875, -0.0005884170532226562, 0.000591278076171875, 0.0017709732055664062, 0.0029506683349609375, 0.004130363464355469, 0.00531005859375, 0.006489753723144531, 0.0076694488525390625, 0.008849143981933594, 0.010028839111328125, 0.011208534240722656, 0.012388229370117188, 0.013567924499511719, 0.01474761962890625, 0.01592731475830078, 0.017107009887695312, 0.018286705017089844, 0.019466400146484375, 0.020646095275878906, 0.021825790405273438, 0.02300548553466797, 0.0241851806640625, 0.02536487579345703, 0.026544570922851562, 0.027724266052246094, 0.028903961181640625, 0.030083656311035156, 0.03126335144042969, 0.03244304656982422, 0.03362274169921875, 0.03480243682861328, 0.03598213195800781, 0.037161827087402344, 0.038341522216796875, 0.039521217346191406, 0.04070091247558594, 0.04188060760498047, 0.043060302734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 19.0, 19.0, 16.0, 21.0, 25.0, 42.0, 58.0, 78.0, 75.0, 88.0, 90.0, 81.0, 79.0, 55.0, 63.0, 38.0, 24.0, 22.0, 18.0, 15.0, 13.0, 5.0, 8.0, 2.0, 2.0, 2.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0206451416015625, -0.019794702529907227, -0.018944263458251953, -0.01809382438659668, -0.017243385314941406, -0.016392946243286133, -0.01554250717163086, -0.014692068099975586, -0.013841629028320312, -0.012991189956665039, -0.012140750885009766, -0.011290311813354492, -0.010439872741699219, -0.009589433670043945, -0.008738994598388672, -0.007888555526733398, -0.007038116455078125, -0.0061876773834228516, -0.005337238311767578, -0.004486799240112305, -0.0036363601684570312, -0.002785921096801758, -0.0019354820251464844, -0.001085042953491211, -0.0002346038818359375, 0.0006158351898193359, 0.0014662742614746094, 0.002316713333129883, 0.0031671524047851562, 0.00401759147644043, 0.004868030548095703, 0.0057184696197509766, 0.00656890869140625, 0.0074193477630615234, 0.008269786834716797, 0.00912022590637207, 0.009970664978027344, 0.010821104049682617, 0.01167154312133789, 0.012521982192993164, 0.013372421264648438, 0.014222860336303711, 0.015073299407958984, 0.015923738479614258, 0.01677417755126953, 0.017624616622924805, 0.018475055694580078, 0.01932549476623535, 0.020175933837890625, 0.0210263729095459, 0.021876811981201172, 0.022727251052856445, 0.02357769012451172, 0.024428129196166992, 0.025278568267822266, 0.02612900733947754, 0.026979446411132812, 0.027829885482788086, 0.02868032455444336, 0.029530763626098633, 0.030381202697753906, 0.03123164176940918, 0.03208208084106445, 0.03293251991271973, 0.033782958984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 14.0, 24.0, 63.0, 115.0, 159.0, 206.0, 174.0, 115.0, 53.0, 36.0, 11.0, 11.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4796094596385956, -0.4638553857803345, -0.44810131192207336, -0.43234723806381226, -0.41659319400787354, -0.4008391201496124, -0.3850850462913513, -0.3693309724330902, -0.3535768985748291, -0.337822824716568, -0.3220687508583069, -0.30631470680236816, -0.29056063294410706, -0.27480655908584595, -0.25905248522758484, -0.24329841136932373, -0.227544367313385, -0.2117902934551239, -0.196036234498024, -0.18028216063976288, -0.16452810168266296, -0.14877402782440186, -0.13301995396614075, -0.11726588755846024, -0.10151182115077972, -0.08575775474309921, -0.0700036883354187, -0.05424961447715759, -0.03849554806947708, -0.02274148166179657, -0.006987407803535461, 0.00876665860414505, 0.024520695209503174, 0.040274761617183685, 0.056028831750154495, 0.0717829018831253, 0.08753696829080582, 0.10329103469848633, 0.11904510855674744, 0.13479918241500854, 0.15055324137210846, 0.16630731523036957, 0.18206137418746948, 0.1978154480457306, 0.2135695219039917, 0.2293235808610916, 0.24507765471935272, 0.26083171367645264, 0.27658578753471375, 0.29233986139297485, 0.30809393525123596, 0.32384800910949707, 0.3396020531654358, 0.3553561270236969, 0.371110200881958, 0.3868642747402191, 0.4026183485984802, 0.41837242245674133, 0.43412649631500244, 0.44988054037094116, 0.46563461422920227, 0.4813886880874634, 0.4971427619457245, 0.5128968358039856, 0.5286508798599243]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 10.0, 9.0, 11.0, 11.0, 11.0, 13.0, 14.0, 13.0, 26.0, 26.0, 25.0, 27.0, 29.0, 30.0, 36.0, 38.0, 37.0, 34.0, 39.0, 47.0, 29.0, 43.0, 44.0, 39.0, 38.0, 32.0, 28.0, 30.0, 30.0, 24.0, 28.0, 24.0, 20.0, 17.0, 7.0, 20.0, 9.0, 11.0, 3.0, 14.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.25301098823547363, -0.24512891471385956, -0.23724684119224548, -0.2293647676706314, -0.22148269414901733, -0.21360062062740326, -0.20571854710578918, -0.19783645868301392, -0.18995440006256104, -0.18207232654094696, -0.17419025301933289, -0.1663081794977188, -0.15842610597610474, -0.15054403245449066, -0.1426619589328766, -0.13477987051010132, -0.12689779698848724, -0.11901572346687317, -0.1111336499452591, -0.10325157642364502, -0.09536950290203094, -0.08748742938041687, -0.0796053484082222, -0.07172327488660812, -0.06384120136499405, -0.055959127843379974, -0.0480770543217659, -0.040194977074861526, -0.03231290355324745, -0.024430830031633377, -0.016548752784729004, -0.00866667926311493, -0.0007846057415008545, 0.007097468711435795, 0.014979543164372444, 0.022861618548631668, 0.030743692070245743, 0.03862576559185982, 0.04650784283876419, 0.054389916360378265, 0.06227198988199234, 0.07015406340360641, 0.07803613692522049, 0.08591821789741516, 0.09380029141902924, 0.10168236494064331, 0.10956443846225739, 0.11744651198387146, 0.12532858550548553, 0.1332106590270996, 0.14109273254871368, 0.14897480607032776, 0.15685687959194183, 0.1647389531135559, 0.17262104153633118, 0.18050310015678406, 0.18838518857955933, 0.1962672621011734, 0.20414933562278748, 0.21203140914440155, 0.21991348266601562, 0.2277955561876297, 0.23567762970924377, 0.24355971813201904, 0.2514417767524719]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 15.0, 9.0, 21.0, 43.0, 77.0, 132.0, 274.0, 664.0, 1915.0, 7713.0, 46663.0, 1042178.0, 2941893.0, 133717.0, 14708.0, 2786.0, 837.0, 301.0, 154.0, 93.0, 43.0, 23.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1365966796875, -0.13248252868652344, -0.12836837768554688, -0.12425422668457031, -0.12014007568359375, -0.11602592468261719, -0.11191177368164062, -0.10779762268066406, -0.1036834716796875, -0.09956932067871094, -0.09545516967773438, -0.09134101867675781, -0.08722686767578125, -0.08311271667480469, -0.07899856567382812, -0.07488441467285156, -0.070770263671875, -0.06665611267089844, -0.06254196166992188, -0.05842781066894531, -0.05431365966796875, -0.05019950866699219, -0.046085357666015625, -0.04197120666503906, -0.0378570556640625, -0.03374290466308594, -0.029628753662109375, -0.025514602661132812, -0.02140045166015625, -0.017286300659179688, -0.013172149658203125, -0.009057998657226562, -0.00494384765625, -0.0008296966552734375, 0.003284454345703125, 0.0073986053466796875, 0.01151275634765625, 0.015626907348632812, 0.019741058349609375, 0.023855209350585938, 0.0279693603515625, 0.03208351135253906, 0.036197662353515625, 0.04031181335449219, 0.04442596435546875, 0.04854011535644531, 0.052654266357421875, 0.05676841735839844, 0.060882568359375, 0.06499671936035156, 0.06911087036132812, 0.07322502136230469, 0.07733917236328125, 0.08145332336425781, 0.08556747436523438, 0.08968162536621094, 0.0937957763671875, 0.09790992736816406, 0.10202407836914062, 0.10613822937011719, 0.11025238037109375, 0.11436653137207031, 0.11848068237304688, 0.12259483337402344, 0.126708984375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 12.0, 19.0, 18.0, 34.0, 37.0, 63.0, 78.0, 93.0, 96.0, 99.0, 98.0, 103.0, 77.0, 49.0, 46.0, 33.0, 12.0, 12.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09820556640625, -0.0953378677368164, -0.09247016906738281, -0.08960247039794922, -0.08673477172851562, -0.08386707305908203, -0.08099937438964844, -0.07813167572021484, -0.07526397705078125, -0.07239627838134766, -0.06952857971191406, -0.06666088104248047, -0.06379318237304688, -0.06092548370361328, -0.05805778503417969, -0.055190086364746094, -0.0523223876953125, -0.049454689025878906, -0.04658699035644531, -0.04371929168701172, -0.040851593017578125, -0.03798389434814453, -0.03511619567871094, -0.032248497009277344, -0.02938079833984375, -0.026513099670410156, -0.023645401000976562, -0.02077770233154297, -0.017910003662109375, -0.015042304992675781, -0.012174606323242188, -0.009306907653808594, -0.006439208984375, -0.0035715103149414062, -0.0007038116455078125, 0.0021638870239257812, 0.005031585693359375, 0.007899284362792969, 0.010766983032226562, 0.013634681701660156, 0.01650238037109375, 0.019370079040527344, 0.022237777709960938, 0.02510547637939453, 0.027973175048828125, 0.03084087371826172, 0.03370857238769531, 0.036576271057128906, 0.0394439697265625, 0.042311668395996094, 0.04517936706542969, 0.04804706573486328, 0.050914764404296875, 0.05378246307373047, 0.05665016174316406, 0.059517860412597656, 0.06238555908203125, 0.06525325775146484, 0.06812095642089844, 0.07098865509033203, 0.07385635375976562, 0.07672405242919922, 0.07959175109863281, 0.0824594497680664, 0.0853271484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 4.0, 11.0, 22.0, 45.0, 56.0, 96.0, 174.0, 294.0, 588.0, 1582.0, 6360.0, 46620.0, 1053610.0, 2966101.0, 104019.0, 10852.0, 2256.0, 754.0, 359.0, 161.0, 129.0, 75.0, 45.0, 32.0, 11.0, 10.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.1276226043701172, -0.12365341186523438, -0.11968421936035156, -0.11571502685546875, -0.11174583435058594, -0.10777664184570312, -0.10380744934082031, -0.0998382568359375, -0.09586906433105469, -0.09189987182617188, -0.08793067932128906, -0.08396148681640625, -0.07999229431152344, -0.07602310180664062, -0.07205390930175781, -0.068084716796875, -0.06411552429199219, -0.060146331787109375, -0.05617713928222656, -0.05220794677734375, -0.04823875427246094, -0.044269561767578125, -0.04030036926269531, -0.0363311767578125, -0.03236198425292969, -0.028392791748046875, -0.024423599243164062, -0.02045440673828125, -0.016485214233398438, -0.012516021728515625, -0.008546829223632812, -0.00457763671875, -0.0006084442138671875, 0.003360748291015625, 0.0073299407958984375, 0.01129913330078125, 0.015268325805664062, 0.019237518310546875, 0.023206710815429688, 0.0271759033203125, 0.031145095825195312, 0.035114288330078125, 0.03908348083496094, 0.04305267333984375, 0.04702186584472656, 0.050991058349609375, 0.05496025085449219, 0.058929443359375, 0.06289863586425781, 0.06686782836914062, 0.07083702087402344, 0.07480621337890625, 0.07877540588378906, 0.08274459838867188, 0.08671379089355469, 0.0906829833984375, 0.09465217590332031, 0.09862136840820312, 0.10259056091308594, 0.10655975341796875, 0.11052894592285156, 0.11449813842773438, 0.11846733093261719, 0.1224365234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 10.0, 22.0, 18.0, 20.0, 35.0, 43.0, 73.0, 86.0, 140.0, 197.0, 397.0, 602.0, 724.0, 626.0, 382.0, 230.0, 121.0, 81.0, 68.0, 44.0, 45.0, 19.0, 13.0, 16.0, 13.0, 11.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07366943359375, -0.07152938842773438, -0.06938934326171875, -0.06724929809570312, -0.0651092529296875, -0.06296920776367188, -0.06082916259765625, -0.058689117431640625, -0.056549072265625, -0.054409027099609375, -0.05226898193359375, -0.050128936767578125, -0.0479888916015625, -0.045848846435546875, -0.04370880126953125, -0.041568756103515625, -0.0394287109375, -0.037288665771484375, -0.03514862060546875, -0.033008575439453125, -0.0308685302734375, -0.028728485107421875, -0.02658843994140625, -0.024448394775390625, -0.022308349609375, -0.020168304443359375, -0.01802825927734375, -0.015888214111328125, -0.0137481689453125, -0.011608123779296875, -0.00946807861328125, -0.007328033447265625, -0.00518798828125, -0.003047943115234375, -0.00090789794921875, 0.001232147216796875, 0.0033721923828125, 0.005512237548828125, 0.00765228271484375, 0.009792327880859375, 0.011932373046875, 0.014072418212890625, 0.01621246337890625, 0.018352508544921875, 0.0204925537109375, 0.022632598876953125, 0.02477264404296875, 0.026912689208984375, 0.029052734375, 0.031192779541015625, 0.03333282470703125, 0.035472869873046875, 0.0376129150390625, 0.039752960205078125, 0.04189300537109375, 0.044033050537109375, 0.046173095703125, 0.048313140869140625, 0.05045318603515625, 0.052593231201171875, 0.0547332763671875, 0.056873321533203125, 0.05901336669921875, 0.061153411865234375, 0.06329345703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 4.0, 42.0, 277.0, 488.0, 164.0, 23.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072157382965088, -2.0325255393981934, -1.9928934574127197, -1.9532614946365356, -1.9136295318603516, -1.8739975690841675, -1.8343656063079834, -1.7947336435317993, -1.7551016807556152, -1.7154697179794312, -1.675837755203247, -1.636205792427063, -1.596573829650879, -1.5569418668746948, -1.5173099040985107, -1.4776779413223267, -1.4380459785461426, -1.3984140157699585, -1.3587820529937744, -1.3191500902175903, -1.2795181274414062, -1.2398861646652222, -1.200254201889038, -1.160622239112854, -1.1209903955459595, -1.0813584327697754, -1.0417264699935913, -1.0020945072174072, -0.9624625444412231, -0.9228305816650391, -0.883198618888855, -0.8435666561126709, -0.8039346933364868, -0.7643027305603027, -0.7246707677841187, -0.6850388050079346, -0.6454068422317505, -0.6057748794555664, -0.5661429166793823, -0.5265109539031982, -0.48687899112701416, -0.4472470283508301, -0.407615065574646, -0.3679831027984619, -0.32835114002227783, -0.28871917724609375, -0.24908724427223206, -0.20945528149604797, -0.1698233187198639, -0.1301913559436798, -0.09055940061807632, -0.05092744529247284, -0.011295482516288757, 0.028336480259895325, 0.06796842813491821, 0.1076003909111023, 0.14723235368728638, 0.18686431646347046, 0.22649627923965454, 0.2661282420158386, 0.3057602047920227, 0.3453921675682068, 0.3850241005420685, 0.42465606331825256, 0.46428802609443665]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 22.0, 15.0, 22.0, 22.0, 30.0, 21.0, 19.0, 24.0, 30.0, 31.0, 34.0, 42.0, 39.0, 37.0, 51.0, 40.0, 46.0, 32.0, 41.0, 48.0, 39.0, 28.0, 28.0, 27.0, 26.0, 24.0, 25.0, 16.0, 17.0, 14.0, 16.0, 11.0, 13.0, 13.0, 4.0, 5.0, 5.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17259842157363892, -0.16733457148075104, -0.16207072138786316, -0.15680688619613647, -0.1515430361032486, -0.14627918601036072, -0.14101535081863403, -0.13575150072574615, -0.13048765063285828, -0.1252238005399704, -0.11995995789766312, -0.11469611525535583, -0.10943226516246796, -0.10416841506958008, -0.0989045724272728, -0.09364072978496552, -0.08837687969207764, -0.08311302959918976, -0.07784918695688248, -0.0725853443145752, -0.06732149422168732, -0.06205764785408974, -0.05679380148649216, -0.05152995511889458, -0.046266108751297, -0.04100226238369942, -0.03573841601610184, -0.030474569648504257, -0.025210723280906677, -0.019946876913309097, -0.014683030545711517, -0.009419184178113937, -0.004155337810516357, 0.0011085085570812225, 0.0063723549246788025, 0.011636201292276382, 0.016900047659873962, 0.022163894027471542, 0.027427740395069122, 0.0326915867626667, 0.03795543313026428, 0.04321927949786186, 0.04848312586545944, 0.05374697223305702, 0.0590108186006546, 0.06427466869354248, 0.06953851133584976, 0.07480235397815704, 0.08006620407104492, 0.0853300541639328, 0.09059389680624008, 0.09585773944854736, 0.10112158954143524, 0.10638543963432312, 0.1116492822766304, 0.11691312491893768, 0.12217697501182556, 0.12744082510471344, 0.13270467519760132, 0.137968510389328, 0.14323236048221588, 0.14849621057510376, 0.15376004576683044, 0.15902389585971832, 0.1642877459526062]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 9.0, 12.0, 9.0, 11.0, 12.0, 22.0, 29.0, 33.0, 40.0, 54.0, 77.0, 105.0, 133.0, 164.0, 316.0, 438.0, 645.0, 1028.0, 2032.0, 4088.0, 9362.0, 24088.0, 63603.0, 159858.0, 301715.0, 269981.0, 127190.0, 49317.0, 18756.0, 7554.0, 3463.0, 1670.0, 874.0, 564.0, 359.0, 236.0, 178.0, 121.0, 94.0, 69.0, 56.0, 47.0, 36.0, 24.0, 19.0, 15.0, 15.0, 10.0, 8.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.0703125, -0.06817340850830078, -0.06603431701660156, -0.06389522552490234, -0.061756134033203125, -0.059617042541503906, -0.05747795104980469, -0.05533885955810547, -0.05319976806640625, -0.05106067657470703, -0.04892158508300781, -0.046782493591308594, -0.044643402099609375, -0.042504310607910156, -0.04036521911621094, -0.03822612762451172, -0.0360870361328125, -0.03394794464111328, -0.03180885314941406, -0.029669761657714844, -0.027530670166015625, -0.025391578674316406, -0.023252487182617188, -0.02111339569091797, -0.01897430419921875, -0.01683521270751953, -0.014696121215820312, -0.012557029724121094, -0.010417938232421875, -0.008278846740722656, -0.0061397552490234375, -0.004000663757324219, -0.001861572265625, 0.00027751922607421875, 0.0024166107177734375, 0.004555702209472656, 0.006694793701171875, 0.008833885192871094, 0.010972976684570312, 0.013112068176269531, 0.01525115966796875, 0.01739025115966797, 0.019529342651367188, 0.021668434143066406, 0.023807525634765625, 0.025946617126464844, 0.028085708618164062, 0.03022480010986328, 0.0323638916015625, 0.03450298309326172, 0.03664207458496094, 0.038781166076660156, 0.040920257568359375, 0.043059349060058594, 0.04519844055175781, 0.04733753204345703, 0.04947662353515625, 0.05161571502685547, 0.05375480651855469, 0.055893898010253906, 0.058032989501953125, 0.060172080993652344, 0.06231117248535156, 0.06445026397705078, 0.06658935546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 13.0, 12.0, 25.0, 35.0, 54.0, 60.0, 71.0, 104.0, 106.0, 134.0, 88.0, 88.0, 59.0, 58.0, 40.0, 25.0, 16.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09454345703125, -0.09176349639892578, -0.08898353576660156, -0.08620357513427734, -0.08342361450195312, -0.0806436538696289, -0.07786369323730469, -0.07508373260498047, -0.07230377197265625, -0.06952381134033203, -0.06674385070800781, -0.0639638900756836, -0.061183929443359375, -0.058403968811035156, -0.05562400817871094, -0.05284404754638672, -0.0500640869140625, -0.04728412628173828, -0.04450416564941406, -0.041724205017089844, -0.038944244384765625, -0.036164283752441406, -0.03338432312011719, -0.03060436248779297, -0.02782440185546875, -0.02504444122314453, -0.022264480590820312, -0.019484519958496094, -0.016704559326171875, -0.013924598693847656, -0.011144638061523438, -0.008364677429199219, -0.005584716796875, -0.0028047561645507812, -2.47955322265625e-05, 0.0027551651000976562, 0.005535125732421875, 0.008315086364746094, 0.011095046997070312, 0.013875007629394531, 0.01665496826171875, 0.01943492889404297, 0.022214889526367188, 0.024994850158691406, 0.027774810791015625, 0.030554771423339844, 0.03333473205566406, 0.03611469268798828, 0.0388946533203125, 0.04167461395263672, 0.04445457458496094, 0.047234535217285156, 0.050014495849609375, 0.052794456481933594, 0.05557441711425781, 0.05835437774658203, 0.06113433837890625, 0.06391429901123047, 0.06669425964355469, 0.0694742202758789, 0.07225418090820312, 0.07503414154052734, 0.07781410217285156, 0.08059406280517578, 0.0833740234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 6.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 12.0, 10.0, 8.0, 5.0, 17.0, 19.0, 25.0, 38.0, 43.0, 53.0, 99.0, 142.0, 257.0, 486.0, 1221.0, 3462.0, 13196.0, 56469.0, 245189.0, 480627.0, 189541.0, 42594.0, 9969.0, 2831.0, 1017.0, 466.0, 239.0, 128.0, 84.0, 71.0, 46.0, 32.0, 24.0, 17.0, 17.0, 16.0, 15.0, 11.0, 9.0, 7.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.08380126953125, -0.08104515075683594, -0.07828903198242188, -0.07553291320800781, -0.07277679443359375, -0.07002067565917969, -0.06726455688476562, -0.06450843811035156, -0.0617523193359375, -0.05899620056152344, -0.056240081787109375, -0.05348396301269531, -0.05072784423828125, -0.04797172546386719, -0.045215606689453125, -0.04245948791503906, -0.039703369140625, -0.03694725036621094, -0.034191131591796875, -0.03143501281738281, -0.02867889404296875, -0.025922775268554688, -0.023166656494140625, -0.020410537719726562, -0.0176544189453125, -0.014898300170898438, -0.012142181396484375, -0.009386062622070312, -0.00662994384765625, -0.0038738250732421875, -0.001117706298828125, 0.0016384124755859375, 0.00439453125, 0.0071506500244140625, 0.009906768798828125, 0.012662887573242188, 0.01541900634765625, 0.018175125122070312, 0.020931243896484375, 0.023687362670898438, 0.0264434814453125, 0.029199600219726562, 0.031955718994140625, 0.03471183776855469, 0.03746795654296875, 0.04022407531738281, 0.042980194091796875, 0.04573631286621094, 0.048492431640625, 0.05124855041503906, 0.054004669189453125, 0.05676078796386719, 0.05951690673828125, 0.06227302551269531, 0.06502914428710938, 0.06778526306152344, 0.0705413818359375, 0.07329750061035156, 0.07605361938476562, 0.07880973815917969, 0.08156585693359375, 0.08432197570800781, 0.08707809448242188, 0.08983421325683594, 0.09259033203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 1.0, 6.0, 13.0, 21.0, 8.0, 15.0, 14.0, 17.0, 29.0, 16.0, 15.0, 27.0, 36.0, 46.0, 28.0, 36.0, 33.0, 24.0, 31.0, 46.0, 39.0, 44.0, 42.0, 37.0, 44.0, 39.0, 29.0, 25.0, 29.0, 35.0, 27.0, 19.0, 18.0, 15.0, 17.0, 13.0, 10.0, 7.0, 11.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.08245849609375, -0.08009719848632812, -0.07773590087890625, -0.07537460327148438, -0.0730133056640625, -0.07065200805664062, -0.06829071044921875, -0.06592941284179688, -0.063568115234375, -0.061206817626953125, -0.05884552001953125, -0.056484222412109375, -0.0541229248046875, -0.051761627197265625, -0.04940032958984375, -0.047039031982421875, -0.044677734375, -0.042316436767578125, -0.03995513916015625, -0.037593841552734375, -0.0352325439453125, -0.032871246337890625, -0.03050994873046875, -0.028148651123046875, -0.025787353515625, -0.023426055908203125, -0.02106475830078125, -0.018703460693359375, -0.0163421630859375, -0.013980865478515625, -0.01161956787109375, -0.009258270263671875, -0.00689697265625, -0.004535675048828125, -0.00217437744140625, 0.000186920166015625, 0.0025482177734375, 0.004909515380859375, 0.00727081298828125, 0.009632110595703125, 0.011993408203125, 0.014354705810546875, 0.01671600341796875, 0.019077301025390625, 0.0214385986328125, 0.023799896240234375, 0.02616119384765625, 0.028522491455078125, 0.0308837890625, 0.033245086669921875, 0.03560638427734375, 0.037967681884765625, 0.0403289794921875, 0.042690277099609375, 0.04505157470703125, 0.047412872314453125, 0.049774169921875, 0.052135467529296875, 0.05449676513671875, 0.056858062744140625, 0.0592193603515625, 0.061580657958984375, 0.06394195556640625, 0.06630325317382812, 0.06866455078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 4.0, 5.0, 3.0, 5.0, 4.0, 6.0, 10.0, 8.0, 19.0, 20.0, 28.0, 37.0, 49.0, 57.0, 85.0, 104.0, 171.0, 229.0, 466.0, 801.0, 1512.0, 3006.0, 6318.0, 14098.0, 34117.0, 85747.0, 198118.0, 302768.0, 226071.0, 102303.0, 40545.0, 16832.0, 7415.0, 3390.0, 1749.0, 954.0, 534.0, 309.0, 201.0, 111.0, 104.0, 66.0, 43.0, 36.0, 25.0, 20.0, 6.0, 8.0, 12.0, 8.0, 5.0, 3.0, 5.0, 7.0, 2.0, 6.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.016204833984375, -0.01569199562072754, -0.015179157257080078, -0.014666318893432617, -0.014153480529785156, -0.013640642166137695, -0.013127803802490234, -0.012614965438842773, -0.012102127075195312, -0.011589288711547852, -0.01107645034790039, -0.01056361198425293, -0.010050773620605469, -0.009537935256958008, -0.009025096893310547, -0.008512258529663086, -0.007999420166015625, -0.007486581802368164, -0.006973743438720703, -0.006460905075073242, -0.005948066711425781, -0.00543522834777832, -0.004922389984130859, -0.0044095516204833984, -0.0038967132568359375, -0.0033838748931884766, -0.0028710365295410156, -0.0023581981658935547, -0.0018453598022460938, -0.0013325214385986328, -0.0008196830749511719, -0.00030684471130371094, 0.00020599365234375, 0.0007188320159912109, 0.0012316703796386719, 0.0017445087432861328, 0.0022573471069335938, 0.0027701854705810547, 0.0032830238342285156, 0.0037958621978759766, 0.0043087005615234375, 0.0048215389251708984, 0.005334377288818359, 0.00584721565246582, 0.006360054016113281, 0.006872892379760742, 0.007385730743408203, 0.007898569107055664, 0.008411407470703125, 0.008924245834350586, 0.009437084197998047, 0.009949922561645508, 0.010462760925292969, 0.01097559928894043, 0.01148843765258789, 0.012001276016235352, 0.012514114379882812, 0.013026952743530273, 0.013539791107177734, 0.014052629470825195, 0.014565467834472656, 0.015078306198120117, 0.015591144561767578, 0.01610398292541504, 0.0166168212890625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 9.0, 5.0, 8.0, 13.0, 15.0, 17.0, 17.0, 21.0, 22.0, 33.0, 25.0, 33.0, 44.0, 33.0, 66.0, 56.0, 53.0, 50.0, 62.0, 52.0, 51.0, 59.0, 38.0, 27.0, 33.0, 23.0, 23.0, 21.0, 19.0, 14.0, 12.0, 5.0, 5.0, 8.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-06, -7.5018033385276794e-06, -7.255002856254578e-06, -7.008202373981476e-06, -6.761401891708374e-06, -6.514601409435272e-06, -6.26780092716217e-06, -6.021000444889069e-06, -5.774199962615967e-06, -5.527399480342865e-06, -5.280598998069763e-06, -5.033798515796661e-06, -4.7869980335235596e-06, -4.540197551250458e-06, -4.293397068977356e-06, -4.046596586704254e-06, -3.7997961044311523e-06, -3.5529956221580505e-06, -3.3061951398849487e-06, -3.059394657611847e-06, -2.812594175338745e-06, -2.5657936930656433e-06, -2.3189932107925415e-06, -2.0721927285194397e-06, -1.8253922462463379e-06, -1.578591763973236e-06, -1.3317912817001343e-06, -1.0849907994270325e-06, -8.381903171539307e-07, -5.913898348808289e-07, -3.4458935260772705e-07, -9.778887033462524e-08, 1.4901161193847656e-07, 3.9581209421157837e-07, 6.426125764846802e-07, 8.89413058757782e-07, 1.1362135410308838e-06, 1.3830140233039856e-06, 1.6298145055770874e-06, 1.8766149878501892e-06, 2.123415470123291e-06, 2.370215952396393e-06, 2.6170164346694946e-06, 2.8638169169425964e-06, 3.1106173992156982e-06, 3.3574178814888e-06, 3.604218363761902e-06, 3.851018846035004e-06, 4.0978193283081055e-06, 4.344619810581207e-06, 4.591420292854309e-06, 4.838220775127411e-06, 5.085021257400513e-06, 5.3318217396736145e-06, 5.578622221946716e-06, 5.825422704219818e-06, 6.07222318649292e-06, 6.319023668766022e-06, 6.5658241510391235e-06, 6.812624633312225e-06, 7.059425115585327e-06, 7.306225597858429e-06, 7.553026080131531e-06, 7.799826562404633e-06, 8.046627044677734e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 11.0, 17.0, 17.0, 37.0, 25.0, 69.0, 72.0, 120.0, 152.0, 248.0, 344.0, 573.0, 890.0, 1423.0, 2490.0, 4671.0, 8786.0, 17721.0, 37295.0, 79246.0, 154339.0, 233728.0, 225512.0, 142132.0, 70800.0, 33487.0, 15892.0, 8005.0, 4270.0, 2334.0, 1436.0, 843.0, 515.0, 340.0, 221.0, 145.0, 86.0, 58.0, 51.0, 39.0, 33.0, 12.0, 18.0, 15.0, 7.0, 3.0, 9.0, 3.0, 4.0, 2.0, 2.0], "bins": [-0.015472412109375, -0.015029430389404297, -0.014586448669433594, -0.01414346694946289, -0.013700485229492188, -0.013257503509521484, -0.012814521789550781, -0.012371540069580078, -0.011928558349609375, -0.011485576629638672, -0.011042594909667969, -0.010599613189697266, -0.010156631469726562, -0.00971364974975586, -0.009270668029785156, -0.008827686309814453, -0.00838470458984375, -0.007941722869873047, -0.007498741149902344, -0.007055759429931641, -0.0066127777099609375, -0.006169795989990234, -0.005726814270019531, -0.005283832550048828, -0.004840850830078125, -0.004397869110107422, -0.003954887390136719, -0.0035119056701660156, -0.0030689239501953125, -0.0026259422302246094, -0.0021829605102539062, -0.0017399787902832031, -0.0012969970703125, -0.0008540153503417969, -0.00041103363037109375, 3.1948089599609375e-05, 0.0004749298095703125, 0.0009179115295410156, 0.0013608932495117188, 0.0018038749694824219, 0.002246856689453125, 0.002689838409423828, 0.0031328201293945312, 0.0035758018493652344, 0.0040187835693359375, 0.004461765289306641, 0.004904747009277344, 0.005347728729248047, 0.00579071044921875, 0.006233692169189453, 0.006676673889160156, 0.007119655609130859, 0.0075626373291015625, 0.008005619049072266, 0.008448600769042969, 0.008891582489013672, 0.009334564208984375, 0.009777545928955078, 0.010220527648925781, 0.010663509368896484, 0.011106491088867188, 0.01154947280883789, 0.011992454528808594, 0.012435436248779297, 0.01287841796875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 9.0, 8.0, 8.0, 13.0, 21.0, 25.0, 23.0, 37.0, 40.0, 39.0, 57.0, 49.0, 50.0, 61.0, 64.0, 61.0, 54.0, 47.0, 49.0, 38.0, 36.0, 40.0, 34.0, 20.0, 19.0, 21.0, 9.0, 10.0, 16.0, 4.0, 4.0, 2.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0128173828125, -0.012355804443359375, -0.01189422607421875, -0.011432647705078125, -0.0109710693359375, -0.010509490966796875, -0.01004791259765625, -0.009586334228515625, -0.009124755859375, -0.008663177490234375, -0.00820159912109375, -0.007740020751953125, -0.0072784423828125, -0.006816864013671875, -0.00635528564453125, -0.005893707275390625, -0.00543212890625, -0.004970550537109375, -0.00450897216796875, -0.004047393798828125, -0.0035858154296875, -0.003124237060546875, -0.00266265869140625, -0.002201080322265625, -0.001739501953125, -0.001277923583984375, -0.00081634521484375, -0.000354766845703125, 0.0001068115234375, 0.000568389892578125, 0.00102996826171875, 0.001491546630859375, 0.001953125, 0.002414703369140625, 0.00287628173828125, 0.003337860107421875, 0.0037994384765625, 0.004261016845703125, 0.00472259521484375, 0.005184173583984375, 0.005645751953125, 0.006107330322265625, 0.00656890869140625, 0.007030487060546875, 0.0074920654296875, 0.007953643798828125, 0.00841522216796875, 0.008876800537109375, 0.00933837890625, 0.009799957275390625, 0.01026153564453125, 0.010723114013671875, 0.0111846923828125, 0.011646270751953125, 0.01210784912109375, 0.012569427490234375, 0.013031005859375, 0.013492584228515625, 0.01395416259765625, 0.014415740966796875, 0.0148773193359375, 0.015338897705078125, 0.01580047607421875, 0.016262054443359375, 0.0167236328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 11.0, 15.0, 44.0, 118.0, 229.0, 253.0, 157.0, 81.0, 45.0, 19.0, 13.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15779608488082886, -0.14364859461784363, -0.1295011043548584, -0.11535362154245377, -0.10120613127946854, -0.0870586410164833, -0.07291115820407867, -0.058763667941093445, -0.044616177678108215, -0.030468689277768135, -0.016321200877428055, -0.0021737143397331238, 0.011973775923252106, 0.026121266186237335, 0.04026874899864197, 0.0544162392616272, 0.06856372952461243, 0.08271121978759766, 0.09685871005058289, 0.11100619286298752, 0.12515369057655334, 0.13930118083953857, 0.1534486562013626, 0.16759614646434784, 0.18174363672733307, 0.1958911269903183, 0.21003861725330353, 0.22418609261512756, 0.2383335828781128, 0.252481073141098, 0.26662856340408325, 0.2807760536670685, 0.2949235439300537, 0.30907103419303894, 0.32321852445602417, 0.3373660147190094, 0.35151350498199463, 0.36566099524497986, 0.3798084855079651, 0.39395594596862793, 0.40810346603393555, 0.4222509562969208, 0.436398446559906, 0.45054593682289124, 0.46469342708587646, 0.4788409173488617, 0.4929884076118469, 0.5071358680725098, 0.5212833881378174, 0.5354308485984802, 0.5495783686637878, 0.5637258291244507, 0.5778733491897583, 0.5920208096504211, 0.6061683297157288, 0.6203157901763916, 0.6344632506370544, 0.6486107110977173, 0.6627582311630249, 0.6769056916236877, 0.6910532116889954, 0.7052006721496582, 0.7193481922149658, 0.7334956526756287, 0.7476431727409363]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 9.0, 7.0, 10.0, 5.0, 13.0, 14.0, 14.0, 25.0, 23.0, 24.0, 29.0, 37.0, 35.0, 31.0, 35.0, 37.0, 33.0, 47.0, 62.0, 42.0, 39.0, 40.0, 46.0, 42.0, 44.0, 22.0, 25.0, 28.0, 28.0, 20.0, 28.0, 12.0, 22.0, 12.0, 16.0, 11.0, 4.0, 3.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.22517025470733643, -0.21760836243629456, -0.2100464552640915, -0.20248456299304962, -0.19492267072200775, -0.1873607635498047, -0.17979887127876282, -0.17223697900772095, -0.16467508673667908, -0.1571131944656372, -0.14955128729343414, -0.14198939502239227, -0.1344275027513504, -0.12686559557914734, -0.11930370330810547, -0.1117418110370636, -0.10417990386486053, -0.09661800414323807, -0.0890561118721962, -0.08149421215057373, -0.07393231987953186, -0.0663704201579094, -0.058808520436286926, -0.05124662443995476, -0.04368472844362259, -0.03612283244729042, -0.028560934588313103, -0.020999036729335785, -0.013437140733003616, -0.005875244736671448, 0.0016866549849510193, 0.009248550981283188, 0.016810446977615356, 0.024372342973947525, 0.031934238970279694, 0.03949613869190216, 0.04705803468823433, 0.0546199306845665, 0.062181830406188965, 0.06974372267723083, 0.0773056223988533, 0.08486752212047577, 0.09242941439151764, 0.0999913141131401, 0.10755321383476257, 0.11511510610580444, 0.12267700582742691, 0.13023890554904938, 0.13780079782009125, 0.14536269009113312, 0.15292459726333618, 0.16048648953437805, 0.16804838180541992, 0.1756102740764618, 0.18317218124866486, 0.19073407351970673, 0.1982959806919098, 0.20585787296295166, 0.21341978013515472, 0.2209816724061966, 0.22854356467723846, 0.23610547184944153, 0.2436673641204834, 0.25122925639152527, 0.25879114866256714]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 2.0, 9.0, 6.0, 13.0, 20.0, 26.0, 37.0, 63.0, 95.0, 143.0, 191.0, 346.0, 578.0, 1140.0, 2413.0, 4858.0, 12469.0, 46326.0, 322594.0, 2221195.0, 1367788.0, 168173.0, 29215.0, 8892.0, 3742.0, 1878.0, 919.0, 457.0, 255.0, 145.0, 107.0, 51.0, 53.0, 30.0, 17.0, 18.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.070556640625, -0.0687403678894043, -0.0669240951538086, -0.06510782241821289, -0.06329154968261719, -0.061475276947021484, -0.05965900421142578, -0.05784273147583008, -0.056026458740234375, -0.05421018600463867, -0.05239391326904297, -0.050577640533447266, -0.04876136779785156, -0.04694509506225586, -0.045128822326660156, -0.04331254959106445, -0.04149627685546875, -0.03968000411987305, -0.037863731384277344, -0.03604745864868164, -0.03423118591308594, -0.032414913177490234, -0.03059864044189453, -0.028782367706298828, -0.026966094970703125, -0.025149822235107422, -0.02333354949951172, -0.021517276763916016, -0.019701004028320312, -0.01788473129272461, -0.016068458557128906, -0.014252185821533203, -0.0124359130859375, -0.010619640350341797, -0.008803367614746094, -0.006987094879150391, -0.0051708221435546875, -0.0033545494079589844, -0.0015382766723632812, 0.0002779960632324219, 0.002094268798828125, 0.003910541534423828, 0.005726814270019531, 0.007543087005615234, 0.009359359741210938, 0.01117563247680664, 0.012991905212402344, 0.014808177947998047, 0.01662445068359375, 0.018440723419189453, 0.020256996154785156, 0.02207326889038086, 0.023889541625976562, 0.025705814361572266, 0.02752208709716797, 0.029338359832763672, 0.031154632568359375, 0.03297090530395508, 0.03478717803955078, 0.036603450775146484, 0.03841972351074219, 0.04023599624633789, 0.042052268981933594, 0.0438685417175293, 0.045684814453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 19.0, 19.0, 44.0, 60.0, 84.0, 87.0, 112.0, 105.0, 119.0, 92.0, 79.0, 69.0, 56.0, 23.0, 15.0, 7.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.099853515625, -0.09697246551513672, -0.09409141540527344, -0.09121036529541016, -0.08832931518554688, -0.0854482650756836, -0.08256721496582031, -0.07968616485595703, -0.07680511474609375, -0.07392406463623047, -0.07104301452636719, -0.0681619644165039, -0.06528091430664062, -0.062399864196777344, -0.05951881408691406, -0.05663776397705078, -0.0537567138671875, -0.05087566375732422, -0.04799461364746094, -0.045113563537597656, -0.042232513427734375, -0.039351463317871094, -0.03647041320800781, -0.03358936309814453, -0.03070831298828125, -0.02782726287841797, -0.024946212768554688, -0.022065162658691406, -0.019184112548828125, -0.016303062438964844, -0.013422012329101562, -0.010540962219238281, -0.007659912109375, -0.004778861999511719, -0.0018978118896484375, 0.0009832382202148438, 0.003864288330078125, 0.006745338439941406, 0.009626388549804688, 0.012507438659667969, 0.01538848876953125, 0.01826953887939453, 0.021150588989257812, 0.024031639099121094, 0.026912689208984375, 0.029793739318847656, 0.03267478942871094, 0.03555583953857422, 0.0384368896484375, 0.04131793975830078, 0.04419898986816406, 0.047080039978027344, 0.049961090087890625, 0.052842140197753906, 0.05572319030761719, 0.05860424041748047, 0.06148529052734375, 0.06436634063720703, 0.06724739074707031, 0.0701284408569336, 0.07300949096679688, 0.07589054107666016, 0.07877159118652344, 0.08165264129638672, 0.08453369140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 4.0, 6.0, 13.0, 19.0, 24.0, 39.0, 70.0, 105.0, 175.0, 261.0, 461.0, 834.0, 1794.0, 4048.0, 10854.0, 32493.0, 114242.0, 561208.0, 2498861.0, 767183.0, 141434.0, 38654.0, 12633.0, 4748.0, 1978.0, 900.0, 493.0, 269.0, 158.0, 94.0, 66.0, 41.0, 27.0, 17.0, 21.0, 16.0, 12.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.042327880859375, -0.04094362258911133, -0.039559364318847656, -0.038175106048583984, -0.03679084777832031, -0.03540658950805664, -0.03402233123779297, -0.0326380729675293, -0.031253814697265625, -0.029869556427001953, -0.02848529815673828, -0.02710103988647461, -0.025716781616210938, -0.024332523345947266, -0.022948265075683594, -0.021564006805419922, -0.02017974853515625, -0.018795490264892578, -0.017411231994628906, -0.016026973724365234, -0.014642715454101562, -0.01325845718383789, -0.011874198913574219, -0.010489940643310547, -0.009105682373046875, -0.007721424102783203, -0.006337165832519531, -0.004952907562255859, -0.0035686492919921875, -0.0021843910217285156, -0.0008001327514648438, 0.0005841255187988281, 0.0019683837890625, 0.003352642059326172, 0.004736900329589844, 0.006121158599853516, 0.0075054168701171875, 0.00888967514038086, 0.010273933410644531, 0.011658191680908203, 0.013042449951171875, 0.014426708221435547, 0.01581096649169922, 0.01719522476196289, 0.018579483032226562, 0.019963741302490234, 0.021347999572753906, 0.022732257843017578, 0.02411651611328125, 0.025500774383544922, 0.026885032653808594, 0.028269290924072266, 0.029653549194335938, 0.03103780746459961, 0.03242206573486328, 0.03380632400512695, 0.035190582275390625, 0.0365748405456543, 0.03795909881591797, 0.03934335708618164, 0.04072761535644531, 0.042111873626708984, 0.043496131896972656, 0.04488039016723633, 0.0462646484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 2.0, 7.0, 6.0, 6.0, 10.0, 23.0, 28.0, 24.0, 42.0, 58.0, 63.0, 89.0, 174.0, 255.0, 412.0, 609.0, 654.0, 585.0, 370.0, 236.0, 144.0, 73.0, 55.0, 39.0, 30.0, 17.0, 19.0, 7.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.04931640625, -0.04795217514038086, -0.04658794403076172, -0.04522371292114258, -0.04385948181152344, -0.0424952507019043, -0.041131019592285156, -0.039766788482666016, -0.038402557373046875, -0.037038326263427734, -0.035674095153808594, -0.03430986404418945, -0.03294563293457031, -0.03158140182495117, -0.03021717071533203, -0.02885293960571289, -0.02748870849609375, -0.02612447738647461, -0.02476024627685547, -0.023396015167236328, -0.022031784057617188, -0.020667552947998047, -0.019303321838378906, -0.017939090728759766, -0.016574859619140625, -0.015210628509521484, -0.013846397399902344, -0.012482166290283203, -0.011117935180664062, -0.009753704071044922, -0.008389472961425781, -0.007025241851806641, -0.0056610107421875, -0.004296779632568359, -0.0029325485229492188, -0.0015683174133300781, -0.0002040863037109375, 0.0011601448059082031, 0.0025243759155273438, 0.0038886070251464844, 0.005252838134765625, 0.006617069244384766, 0.007981300354003906, 0.009345531463623047, 0.010709762573242188, 0.012073993682861328, 0.013438224792480469, 0.01480245590209961, 0.01616668701171875, 0.01753091812133789, 0.01889514923095703, 0.020259380340576172, 0.021623611450195312, 0.022987842559814453, 0.024352073669433594, 0.025716304779052734, 0.027080535888671875, 0.028444766998291016, 0.029808998107910156, 0.031173229217529297, 0.03253746032714844, 0.03390169143676758, 0.03526592254638672, 0.03663015365600586, 0.037994384765625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 17.0, 62.0, 204.0, 384.0, 269.0, 58.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.075838565826416, -1.0561712980270386, -1.0365040302276611, -1.0168367624282837, -0.9971694946289062, -0.9775022864341736, -0.9578350186347961, -0.9381677508354187, -0.9185004830360413, -0.8988332152366638, -0.8791659474372864, -0.8594986796379089, -0.8398314714431763, -0.8201642036437988, -0.8004969358444214, -0.780829668045044, -0.7611624002456665, -0.7414951324462891, -0.7218278646469116, -0.7021605968475342, -0.6824933290481567, -0.6628261208534241, -0.6431588530540466, -0.6234915852546692, -0.6038243174552917, -0.5841570496559143, -0.5644897818565369, -0.5448225140571594, -0.5251553058624268, -0.5054880380630493, -0.4858207702636719, -0.46615350246429443, -0.446486234664917, -0.42681896686553955, -0.4071516990661621, -0.38748446106910706, -0.3678171932697296, -0.3481499254703522, -0.3284826874732971, -0.3088154196739197, -0.28914815187454224, -0.2694808840751648, -0.24981363117694855, -0.2301463782787323, -0.21047911047935486, -0.19081184267997742, -0.17114458978176117, -0.15147733688354492, -0.13181006908416748, -0.11214280873537064, -0.09247554838657379, -0.07280828803777695, -0.0531410276889801, -0.03347376734018326, -0.013806506991386414, 0.005860745906829834, 0.025528013706207275, 0.04519527405500412, 0.06486253440380096, 0.08452979475259781, 0.10419705510139465, 0.1238643154501915, 0.14353157579898834, 0.1631988286972046, 0.18286609649658203]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 1.0, 10.0, 9.0, 11.0, 14.0, 13.0, 15.0, 29.0, 34.0, 31.0, 36.0, 37.0, 34.0, 55.0, 55.0, 46.0, 60.0, 47.0, 47.0, 39.0, 48.0, 35.0, 46.0, 39.0, 35.0, 28.0, 27.0, 26.0, 26.0, 18.0, 7.0, 7.0, 15.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.16697907447814941, -0.16230547428131104, -0.15763185918331146, -0.15295825898647308, -0.1482846438884735, -0.14361104369163513, -0.13893742859363556, -0.13426382839679718, -0.1295902132987976, -0.12491660565137863, -0.12024299800395966, -0.11556939035654068, -0.1108957827091217, -0.10622218251228333, -0.10154857486486435, -0.09687496721744537, -0.092201367020607, -0.08752775937318802, -0.08285415172576904, -0.07818054407835007, -0.07350693643093109, -0.06883333623409271, -0.06415972858667374, -0.05948612093925476, -0.054812513291835785, -0.05013890564441681, -0.04546529799699783, -0.040791694074869156, -0.03611808642745018, -0.031444478780031204, -0.026770872995257378, -0.02209726721048355, -0.017423659563064575, -0.012750052846968174, -0.008076446130871773, -0.0034028394147753716, 0.0012707673013210297, 0.0059443749487400055, 0.010617980733513832, 0.015291586518287659, 0.019965194165706635, 0.02463880181312561, 0.029312407597899437, 0.033986013382673264, 0.03865962103009224, 0.043333228677511215, 0.04800683259963989, 0.05268044024705887, 0.057354047894477844, 0.06202765554189682, 0.0667012631893158, 0.07137487083673477, 0.07604847848415375, 0.08072207868099213, 0.0853956863284111, 0.09006929397583008, 0.09474290162324905, 0.09941650927066803, 0.104090116918087, 0.10876372456550598, 0.11343732476234436, 0.11811093986034393, 0.12278454005718231, 0.12745815515518188, 0.13213175535202026]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 8.0, 9.0, 10.0, 20.0, 18.0, 35.0, 34.0, 65.0, 93.0, 127.0, 151.0, 255.0, 350.0, 511.0, 1052.0, 2194.0, 5180.0, 14623.0, 48250.0, 157620.0, 369098.0, 295520.0, 104729.0, 31188.0, 9759.0, 3648.0, 1608.0, 884.0, 471.0, 308.0, 213.0, 136.0, 95.0, 87.0, 47.0, 43.0, 25.0, 25.0, 20.0, 14.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06512451171875, -0.06294059753417969, -0.060756683349609375, -0.05857276916503906, -0.05638885498046875, -0.05420494079589844, -0.052021026611328125, -0.04983711242675781, -0.0476531982421875, -0.04546928405761719, -0.043285369873046875, -0.04110145568847656, -0.03891754150390625, -0.03673362731933594, -0.034549713134765625, -0.03236579895019531, -0.030181884765625, -0.027997970581054688, -0.025814056396484375, -0.023630142211914062, -0.02144622802734375, -0.019262313842773438, -0.017078399658203125, -0.014894485473632812, -0.0127105712890625, -0.010526657104492188, -0.008342742919921875, -0.0061588287353515625, -0.00397491455078125, -0.0017910003662109375, 0.000392913818359375, 0.0025768280029296875, 0.0047607421875, 0.0069446563720703125, 0.009128570556640625, 0.011312484741210938, 0.01349639892578125, 0.015680313110351562, 0.017864227294921875, 0.020048141479492188, 0.0222320556640625, 0.024415969848632812, 0.026599884033203125, 0.028783798217773438, 0.03096771240234375, 0.03315162658691406, 0.035335540771484375, 0.03751945495605469, 0.039703369140625, 0.04188728332519531, 0.044071197509765625, 0.04625511169433594, 0.04843902587890625, 0.05062294006347656, 0.052806854248046875, 0.05499076843261719, 0.0571746826171875, 0.05935859680175781, 0.061542510986328125, 0.06372642517089844, 0.06591033935546875, 0.06809425354003906, 0.07027816772460938, 0.07246208190917969, 0.07464599609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 7.0, 18.0, 28.0, 42.0, 57.0, 58.0, 91.0, 97.0, 122.0, 118.0, 95.0, 73.0, 76.0, 56.0, 32.0, 18.0, 8.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0950927734375, -0.0923614501953125, -0.089630126953125, -0.0868988037109375, -0.08416748046875, -0.0814361572265625, -0.078704833984375, -0.0759735107421875, -0.0732421875, -0.0705108642578125, -0.067779541015625, -0.0650482177734375, -0.06231689453125, -0.0595855712890625, -0.056854248046875, -0.0541229248046875, -0.0513916015625, -0.0486602783203125, -0.045928955078125, -0.0431976318359375, -0.04046630859375, -0.0377349853515625, -0.035003662109375, -0.0322723388671875, -0.029541015625, -0.0268096923828125, -0.024078369140625, -0.0213470458984375, -0.01861572265625, -0.0158843994140625, -0.013153076171875, -0.0104217529296875, -0.0076904296875, -0.0049591064453125, -0.002227783203125, 0.0005035400390625, 0.00323486328125, 0.0059661865234375, 0.008697509765625, 0.0114288330078125, 0.01416015625, 0.0168914794921875, 0.019622802734375, 0.0223541259765625, 0.02508544921875, 0.0278167724609375, 0.030548095703125, 0.0332794189453125, 0.0360107421875, 0.0387420654296875, 0.041473388671875, 0.0442047119140625, 0.04693603515625, 0.0496673583984375, 0.052398681640625, 0.0551300048828125, 0.057861328125, 0.0605926513671875, 0.063323974609375, 0.0660552978515625, 0.06878662109375, 0.0715179443359375, 0.074249267578125, 0.0769805908203125, 0.0797119140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 12.0, 14.0, 20.0, 25.0, 21.0, 51.0, 64.0, 127.0, 245.0, 966.0, 5617.0, 60736.0, 588109.0, 359892.0, 28303.0, 3147.0, 637.0, 219.0, 91.0, 66.0, 39.0, 26.0, 23.0, 18.0, 18.0, 17.0, 19.0, 8.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1197509765625, -0.11586952209472656, -0.11198806762695312, -0.10810661315917969, -0.10422515869140625, -0.10034370422363281, -0.09646224975585938, -0.09258079528808594, -0.0886993408203125, -0.08481788635253906, -0.08093643188476562, -0.07705497741699219, -0.07317352294921875, -0.06929206848144531, -0.06541061401367188, -0.06152915954589844, -0.057647705078125, -0.05376625061035156, -0.049884796142578125, -0.04600334167480469, -0.04212188720703125, -0.03824043273925781, -0.034358978271484375, -0.030477523803710938, -0.0265960693359375, -0.022714614868164062, -0.018833160400390625, -0.014951705932617188, -0.01107025146484375, -0.0071887969970703125, -0.003307342529296875, 0.0005741119384765625, 0.00445556640625, 0.008337020874023438, 0.012218475341796875, 0.016099929809570312, 0.01998138427734375, 0.023862838745117188, 0.027744293212890625, 0.03162574768066406, 0.0355072021484375, 0.03938865661621094, 0.043270111083984375, 0.04715156555175781, 0.05103302001953125, 0.05491447448730469, 0.058795928955078125, 0.06267738342285156, 0.066558837890625, 0.07044029235839844, 0.07432174682617188, 0.07820320129394531, 0.08208465576171875, 0.08596611022949219, 0.08984756469726562, 0.09372901916503906, 0.0976104736328125, 0.10149192810058594, 0.10537338256835938, 0.10925483703613281, 0.11313629150390625, 0.11701774597167969, 0.12089920043945312, 0.12478065490722656, 0.128662109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 12.0, 12.0, 16.0, 10.0, 27.0, 21.0, 21.0, 31.0, 37.0, 46.0, 40.0, 44.0, 50.0, 42.0, 51.0, 68.0, 55.0, 48.0, 44.0, 44.0, 47.0, 43.0, 42.0, 31.0, 28.0, 15.0, 21.0, 16.0, 15.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09698486328125, -0.09404468536376953, -0.09110450744628906, -0.0881643295288086, -0.08522415161132812, -0.08228397369384766, -0.07934379577636719, -0.07640361785888672, -0.07346343994140625, -0.07052326202392578, -0.06758308410644531, -0.06464290618896484, -0.061702728271484375, -0.058762550354003906, -0.05582237243652344, -0.05288219451904297, -0.0499420166015625, -0.04700183868408203, -0.04406166076660156, -0.041121482849121094, -0.038181304931640625, -0.035241127014160156, -0.03230094909667969, -0.02936077117919922, -0.02642059326171875, -0.02348041534423828, -0.020540237426757812, -0.017600059509277344, -0.014659881591796875, -0.011719703674316406, -0.008779525756835938, -0.005839347839355469, -0.002899169921875, 4.100799560546875e-05, 0.0029811859130859375, 0.005921363830566406, 0.008861541748046875, 0.011801719665527344, 0.014741897583007812, 0.01768207550048828, 0.02062225341796875, 0.02356243133544922, 0.026502609252929688, 0.029442787170410156, 0.032382965087890625, 0.035323143005371094, 0.03826332092285156, 0.04120349884033203, 0.0441436767578125, 0.04708385467529297, 0.05002403259277344, 0.052964210510253906, 0.055904388427734375, 0.058844566345214844, 0.06178474426269531, 0.06472492218017578, 0.06766510009765625, 0.07060527801513672, 0.07354545593261719, 0.07648563385009766, 0.07942581176757812, 0.0823659896850586, 0.08530616760253906, 0.08824634552001953, 0.0911865234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 10.0, 18.0, 20.0, 41.0, 67.0, 158.0, 314.0, 779.0, 1855.0, 5097.0, 15717.0, 52043.0, 170278.0, 367263.0, 287733.0, 102444.0, 30063.0, 9281.0, 3132.0, 1221.0, 519.0, 227.0, 126.0, 58.0, 31.0, 15.0, 12.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0197906494140625, -0.01922154426574707, -0.01865243911743164, -0.01808333396911621, -0.01751422882080078, -0.01694512367248535, -0.016376018524169922, -0.015806913375854492, -0.015237808227539062, -0.014668703079223633, -0.014099597930908203, -0.013530492782592773, -0.012961387634277344, -0.012392282485961914, -0.011823177337646484, -0.011254072189331055, -0.010684967041015625, -0.010115861892700195, -0.009546756744384766, -0.008977651596069336, -0.008408546447753906, -0.007839441299438477, -0.007270336151123047, -0.006701231002807617, -0.0061321258544921875, -0.005563020706176758, -0.004993915557861328, -0.0044248104095458984, -0.0038557052612304688, -0.003286600112915039, -0.0027174949645996094, -0.0021483898162841797, -0.00157928466796875, -0.0010101795196533203, -0.0004410743713378906, 0.00012803077697753906, 0.0006971359252929688, 0.0012662410736083984, 0.0018353462219238281, 0.002404451370239258, 0.0029735565185546875, 0.003542661666870117, 0.004111766815185547, 0.0046808719635009766, 0.005249977111816406, 0.005819082260131836, 0.006388187408447266, 0.006957292556762695, 0.007526397705078125, 0.008095502853393555, 0.008664608001708984, 0.009233713150024414, 0.009802818298339844, 0.010371923446655273, 0.010941028594970703, 0.011510133743286133, 0.012079238891601562, 0.012648344039916992, 0.013217449188232422, 0.013786554336547852, 0.014355659484863281, 0.014924764633178711, 0.01549386978149414, 0.01606297492980957, 0.016632080078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 14.0, 12.0, 16.0, 9.0, 30.0, 23.0, 31.0, 30.0, 41.0, 40.0, 58.0, 42.0, 74.0, 39.0, 57.0, 36.0, 64.0, 58.0, 45.0, 46.0, 35.0, 30.0, 19.0, 33.0, 17.0, 28.0, 10.0, 12.0, 4.0, 8.0, 6.0, 9.0, 5.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.226822733879089e-06, -6.016343832015991e-06, -5.805864930152893e-06, -5.595386028289795e-06, -5.384907126426697e-06, -5.174428224563599e-06, -4.9639493227005005e-06, -4.753470420837402e-06, -4.542991518974304e-06, -4.332512617111206e-06, -4.122033715248108e-06, -3.91155481338501e-06, -3.7010759115219116e-06, -3.4905970096588135e-06, -3.2801181077957153e-06, -3.069639205932617e-06, -2.859160304069519e-06, -2.648681402206421e-06, -2.4382025003433228e-06, -2.2277235984802246e-06, -2.0172446966171265e-06, -1.8067657947540283e-06, -1.5962868928909302e-06, -1.385807991027832e-06, -1.1753290891647339e-06, -9.648501873016357e-07, -7.543712854385376e-07, -5.438923835754395e-07, -3.334134817123413e-07, -1.2293457984924316e-07, 8.754432201385498e-08, 2.980232238769531e-07, 5.085021257400513e-07, 7.189810276031494e-07, 9.294599294662476e-07, 1.1399388313293457e-06, 1.3504177331924438e-06, 1.560896635055542e-06, 1.7713755369186401e-06, 1.9818544387817383e-06, 2.1923333406448364e-06, 2.4028122425079346e-06, 2.6132911443710327e-06, 2.823770046234131e-06, 3.034248948097229e-06, 3.244727849960327e-06, 3.4552067518234253e-06, 3.6656856536865234e-06, 3.876164555549622e-06, 4.08664345741272e-06, 4.297122359275818e-06, 4.507601261138916e-06, 4.718080163002014e-06, 4.928559064865112e-06, 5.1390379667282104e-06, 5.349516868591309e-06, 5.559995770454407e-06, 5.770474672317505e-06, 5.980953574180603e-06, 6.191432476043701e-06, 6.401911377906799e-06, 6.6123902797698975e-06, 6.822869181632996e-06, 7.033348083496094e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 5.0, 7.0, 15.0, 18.0, 30.0, 44.0, 59.0, 123.0, 195.0, 306.0, 593.0, 1122.0, 2278.0, 5329.0, 14112.0, 43278.0, 136356.0, 325222.0, 321068.0, 132848.0, 41916.0, 13833.0, 5189.0, 2154.0, 1098.0, 573.0, 310.0, 166.0, 107.0, 62.0, 44.0, 28.0, 21.0, 13.0, 6.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02093505859375, -0.020353317260742188, -0.019771575927734375, -0.019189834594726562, -0.01860809326171875, -0.018026351928710938, -0.017444610595703125, -0.016862869262695312, -0.0162811279296875, -0.015699386596679688, -0.015117645263671875, -0.014535903930664062, -0.01395416259765625, -0.013372421264648438, -0.012790679931640625, -0.012208938598632812, -0.011627197265625, -0.011045455932617188, -0.010463714599609375, -0.009881973266601562, -0.00930023193359375, -0.008718490600585938, -0.008136749267578125, -0.0075550079345703125, -0.0069732666015625, -0.0063915252685546875, -0.005809783935546875, -0.0052280426025390625, -0.00464630126953125, -0.0040645599365234375, -0.003482818603515625, -0.0029010772705078125, -0.0023193359375, -0.0017375946044921875, -0.001155853271484375, -0.0005741119384765625, 7.62939453125e-06, 0.0005893707275390625, 0.001171112060546875, 0.0017528533935546875, 0.0023345947265625, 0.0029163360595703125, 0.003498077392578125, 0.0040798187255859375, 0.00466156005859375, 0.0052433013916015625, 0.005825042724609375, 0.0064067840576171875, 0.006988525390625, 0.0075702667236328125, 0.008152008056640625, 0.008733749389648438, 0.00931549072265625, 0.009897232055664062, 0.010478973388671875, 0.011060714721679688, 0.0116424560546875, 0.012224197387695312, 0.012805938720703125, 0.013387680053710938, 0.01396942138671875, 0.014551162719726562, 0.015132904052734375, 0.015714645385742188, 0.01629638671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 7.0, 5.0, 9.0, 16.0, 17.0, 21.0, 26.0, 36.0, 30.0, 36.0, 59.0, 59.0, 77.0, 57.0, 76.0, 65.0, 56.0, 52.0, 43.0, 46.0, 40.0, 32.0, 30.0, 22.0, 18.0, 10.0, 18.0, 7.0, 8.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.01611328125, -0.015616416931152344, -0.015119552612304688, -0.014622688293457031, -0.014125823974609375, -0.013628959655761719, -0.013132095336914062, -0.012635231018066406, -0.01213836669921875, -0.011641502380371094, -0.011144638061523438, -0.010647773742675781, -0.010150909423828125, -0.009654045104980469, -0.009157180786132812, -0.008660316467285156, -0.0081634521484375, -0.007666587829589844, -0.0071697235107421875, -0.006672859191894531, -0.006175994873046875, -0.005679130554199219, -0.0051822662353515625, -0.004685401916503906, -0.00418853759765625, -0.0036916732788085938, -0.0031948089599609375, -0.0026979446411132812, -0.002201080322265625, -0.0017042160034179688, -0.0012073516845703125, -0.0007104873657226562, -0.000213623046875, 0.00028324127197265625, 0.0007801055908203125, 0.0012769699096679688, 0.001773834228515625, 0.0022706985473632812, 0.0027675628662109375, 0.0032644271850585938, 0.00376129150390625, 0.004258155822753906, 0.0047550201416015625, 0.005251884460449219, 0.005748748779296875, 0.006245613098144531, 0.0067424774169921875, 0.007239341735839844, 0.0077362060546875, 0.008233070373535156, 0.008729934692382812, 0.009226799011230469, 0.009723663330078125, 0.010220527648925781, 0.010717391967773438, 0.011214256286621094, 0.01171112060546875, 0.012207984924316406, 0.012704849243164062, 0.013201713562011719, 0.013698577880859375, 0.014195442199707031, 0.014692306518554688, 0.015189170837402344, 0.01568603515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 18.0, 176.0, 599.0, 193.0, 20.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36426013708114624, -0.3296321630477905, -0.2950042188167572, -0.2603762745857239, -0.22574830055236816, -0.19112034142017365, -0.15649238228797913, -0.1218644231557846, -0.08723646402359009, -0.05260850489139557, -0.01798054575920105, 0.01664741337299347, 0.05127537250518799, 0.08590333163738251, 0.12053129076957703, 0.15515924990177155, 0.18978720903396606, 0.22441516816616058, 0.2590431272983551, 0.2936710715293884, 0.32829904556274414, 0.36292701959609985, 0.3975549638271332, 0.4321829080581665, 0.4668108820915222, 0.5014388561248779, 0.5360667705535889, 0.5706947445869446, 0.6053227186203003, 0.639950692653656, 0.6745786666870117, 0.7092065811157227, 0.7438344955444336, 0.7784624695777893, 0.813090443611145, 0.847718358039856, 0.8823463320732117, 0.9169743061065674, 0.9516022205352783, 0.986230194568634, 1.0208581686019897, 1.0554860830307007, 1.0901141166687012, 1.124742031097412, 1.159369945526123, 1.1939979791641235, 1.2286258935928345, 1.263253927230835, 1.297881841659546, 1.3325097560882568, 1.3671377897262573, 1.4017657041549683, 1.4363937377929688, 1.4710216522216797, 1.5056495666503906, 1.5402776002883911, 1.574905514717102, 1.609533429145813, 1.6441614627838135, 1.6787893772125244, 1.7134172916412354, 1.7480453252792358, 1.7826732397079468, 1.8173012733459473, 1.8519291877746582]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 16.0, 13.0, 6.0, 11.0, 13.0, 13.0, 18.0, 24.0, 23.0, 27.0, 40.0, 35.0, 40.0, 32.0, 46.0, 41.0, 43.0, 41.0, 48.0, 38.0, 41.0, 45.0, 36.0, 29.0, 35.0, 30.0, 21.0, 26.0, 17.0, 23.0, 23.0, 19.0, 15.0, 12.0, 10.0, 10.0, 13.0, 10.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.17232096195220947, -0.16597825288772583, -0.159635528922081, -0.15329281985759735, -0.14695009589195251, -0.14060738682746887, -0.13426467776298523, -0.1279219537973404, -0.12157923728227615, -0.11523652076721191, -0.10889380425214767, -0.10255108773708344, -0.09620837867259979, -0.08986565470695496, -0.08352294564247131, -0.07718022912740707, -0.07083751261234283, -0.0644947960972786, -0.058152079582214355, -0.051809366792440414, -0.045466650277376175, -0.039123933762311935, -0.032781220972537994, -0.026438504457473755, -0.020095787942409515, -0.01375307235866785, -0.007410356774926186, -0.0010676421225070953, 0.005275074392557144, 0.011617790907621384, 0.017960503697395325, 0.024303220212459564, 0.030645936727523804, 0.03698865324258804, 0.04333136975765228, 0.049674082547426224, 0.05601679906249046, 0.0623595155775547, 0.06870222836732864, 0.07504494488239288, 0.08138766139745712, 0.08773037791252136, 0.0940730944275856, 0.10041581094264984, 0.10675852000713348, 0.11310124397277832, 0.11944395303726196, 0.1257866621017456, 0.13212938606739044, 0.13847209513187408, 0.14481481909751892, 0.15115752816200256, 0.1575002521276474, 0.16384296119213104, 0.17018568515777588, 0.17652839422225952, 0.18287110328674316, 0.1892138123512268, 0.19555653631687164, 0.20189924538135529, 0.20824196934700012, 0.21458467841148376, 0.2209273874759674, 0.22727011144161224, 0.23361283540725708]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 11.0, 6.0, 17.0, 23.0, 37.0, 47.0, 77.0, 139.0, 214.0, 413.0, 901.0, 2019.0, 4665.0, 14316.0, 89750.0, 1042835.0, 2753834.0, 242958.0, 29410.0, 7360.0, 2829.0, 1238.0, 561.0, 237.0, 125.0, 93.0, 43.0, 33.0, 29.0, 22.0, 15.0, 7.0, 2.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.060546875, -0.05860710144042969, -0.056667327880859375, -0.05472755432128906, -0.05278778076171875, -0.05084800720214844, -0.048908233642578125, -0.04696846008300781, -0.0450286865234375, -0.04308891296386719, -0.041149139404296875, -0.03920936584472656, -0.03726959228515625, -0.03532981872558594, -0.033390045166015625, -0.03145027160644531, -0.029510498046875, -0.027570724487304688, -0.025630950927734375, -0.023691177368164062, -0.02175140380859375, -0.019811630249023438, -0.017871856689453125, -0.015932083129882812, -0.0139923095703125, -0.012052536010742188, -0.010112762451171875, -0.008172988891601562, -0.00623321533203125, -0.0042934417724609375, -0.002353668212890625, -0.0004138946533203125, 0.00152587890625, 0.0034656524658203125, 0.005405426025390625, 0.0073451995849609375, 0.00928497314453125, 0.011224746704101562, 0.013164520263671875, 0.015104293823242188, 0.0170440673828125, 0.018983840942382812, 0.020923614501953125, 0.022863388061523438, 0.02480316162109375, 0.026742935180664062, 0.028682708740234375, 0.030622482299804688, 0.032562255859375, 0.03450202941894531, 0.036441802978515625, 0.03838157653808594, 0.04032135009765625, 0.04226112365722656, 0.044200897216796875, 0.04614067077636719, 0.0480804443359375, 0.05002021789550781, 0.051959991455078125, 0.05389976501464844, 0.05583953857421875, 0.05777931213378906, 0.059719085693359375, 0.06165885925292969, 0.0635986328125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 14.0, 15.0, 27.0, 46.0, 68.0, 86.0, 100.0, 105.0, 119.0, 101.0, 92.0, 85.0, 63.0, 36.0, 20.0, 6.0, 8.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0985107421875, -0.0957174301147461, -0.09292411804199219, -0.09013080596923828, -0.08733749389648438, -0.08454418182373047, -0.08175086975097656, -0.07895755767822266, -0.07616424560546875, -0.07337093353271484, -0.07057762145996094, -0.06778430938720703, -0.06499099731445312, -0.06219768524169922, -0.05940437316894531, -0.056611061096191406, -0.0538177490234375, -0.051024436950683594, -0.04823112487792969, -0.04543781280517578, -0.042644500732421875, -0.03985118865966797, -0.03705787658691406, -0.034264564514160156, -0.03147125244140625, -0.028677940368652344, -0.025884628295898438, -0.02309131622314453, -0.020298004150390625, -0.01750469207763672, -0.014711380004882812, -0.011918067932128906, -0.009124755859375, -0.006331443786621094, -0.0035381317138671875, -0.0007448196411132812, 0.002048492431640625, 0.004841804504394531, 0.0076351165771484375, 0.010428428649902344, 0.01322174072265625, 0.016015052795410156, 0.018808364868164062, 0.02160167694091797, 0.024394989013671875, 0.02718830108642578, 0.029981613159179688, 0.032774925231933594, 0.0355682373046875, 0.038361549377441406, 0.04115486145019531, 0.04394817352294922, 0.046741485595703125, 0.04953479766845703, 0.05232810974121094, 0.055121421813964844, 0.05791473388671875, 0.060708045959472656, 0.06350135803222656, 0.06629467010498047, 0.06908798217773438, 0.07188129425048828, 0.07467460632324219, 0.0774679183959961, 0.08026123046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 2.0, 12.0, 21.0, 31.0, 58.0, 73.0, 132.0, 273.0, 535.0, 955.0, 2219.0, 5493.0, 15463.0, 54555.0, 269682.0, 2196587.0, 1409609.0, 178840.0, 39663.0, 11908.0, 4420.0, 1924.0, 876.0, 438.0, 226.0, 117.0, 70.0, 38.0, 29.0, 13.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041778564453125, -0.040425777435302734, -0.03907299041748047, -0.0377202033996582, -0.03636741638183594, -0.03501462936401367, -0.033661842346191406, -0.03230905532836914, -0.030956268310546875, -0.02960348129272461, -0.028250694274902344, -0.026897907257080078, -0.025545120239257812, -0.024192333221435547, -0.02283954620361328, -0.021486759185791016, -0.02013397216796875, -0.018781185150146484, -0.01742839813232422, -0.016075611114501953, -0.014722824096679688, -0.013370037078857422, -0.012017250061035156, -0.01066446304321289, -0.009311676025390625, -0.00795888900756836, -0.006606101989746094, -0.005253314971923828, -0.0039005279541015625, -0.002547740936279297, -0.0011949539184570312, 0.00015783309936523438, 0.0015106201171875, 0.0028634071350097656, 0.004216194152832031, 0.005568981170654297, 0.0069217681884765625, 0.008274555206298828, 0.009627342224121094, 0.01098012924194336, 0.012332916259765625, 0.01368570327758789, 0.015038490295410156, 0.016391277313232422, 0.017744064331054688, 0.019096851348876953, 0.02044963836669922, 0.021802425384521484, 0.02315521240234375, 0.024507999420166016, 0.02586078643798828, 0.027213573455810547, 0.028566360473632812, 0.029919147491455078, 0.031271934509277344, 0.03262472152709961, 0.033977508544921875, 0.03533029556274414, 0.036683082580566406, 0.03803586959838867, 0.03938865661621094, 0.0407414436340332, 0.04209423065185547, 0.043447017669677734, 0.0447998046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 20.0, 16.0, 33.0, 34.0, 85.0, 153.0, 273.0, 537.0, 775.0, 820.0, 573.0, 300.0, 184.0, 98.0, 48.0, 36.0, 21.0, 19.0, 8.0, 6.0, 5.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0440673828125, -0.04273366928100586, -0.04139995574951172, -0.04006624221801758, -0.03873252868652344, -0.0373988151550293, -0.036065101623535156, -0.034731388092041016, -0.033397674560546875, -0.032063961029052734, -0.030730247497558594, -0.029396533966064453, -0.028062820434570312, -0.026729106903076172, -0.02539539337158203, -0.02406167984008789, -0.02272796630859375, -0.02139425277709961, -0.02006053924560547, -0.018726825714111328, -0.017393112182617188, -0.016059398651123047, -0.014725685119628906, -0.013391971588134766, -0.012058258056640625, -0.010724544525146484, -0.009390830993652344, -0.008057117462158203, -0.0067234039306640625, -0.005389690399169922, -0.004055976867675781, -0.0027222633361816406, -0.0013885498046875, -5.4836273193359375e-05, 0.0012788772583007812, 0.002612590789794922, 0.0039463043212890625, 0.005280017852783203, 0.006613731384277344, 0.007947444915771484, 0.009281158447265625, 0.010614871978759766, 0.011948585510253906, 0.013282299041748047, 0.014616012573242188, 0.015949726104736328, 0.01728343963623047, 0.01861715316772461, 0.01995086669921875, 0.02128458023071289, 0.02261829376220703, 0.023952007293701172, 0.025285720825195312, 0.026619434356689453, 0.027953147888183594, 0.029286861419677734, 0.030620574951171875, 0.031954288482666016, 0.033288002014160156, 0.0346217155456543, 0.03595542907714844, 0.03728914260864258, 0.03862285614013672, 0.03995656967163086, 0.041290283203125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 19.0, 71.0, 144.0, 302.0, 239.0, 141.0, 48.0, 22.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.5724175572395325, -0.5616039037704468, -0.5507901906967163, -0.5399765372276306, -0.5291628241539001, -0.5183491706848145, -0.507535457611084, -0.4967217743396759, -0.4859080910682678, -0.47509440779685974, -0.46428072452545166, -0.4534670412540436, -0.4426533579826355, -0.4318396747112274, -0.42102599143981934, -0.41021230816841125, -0.3993986248970032, -0.3885849416255951, -0.377771258354187, -0.36695757508277893, -0.35614389181137085, -0.34533020853996277, -0.3345165252685547, -0.3237028419971466, -0.3128891885280609, -0.30207550525665283, -0.29126182198524475, -0.28044813871383667, -0.2696344554424286, -0.2588207721710205, -0.24800708889961243, -0.23719340562820435, -0.22637970745563507, -0.215566024184227, -0.2047523409128189, -0.19393865764141083, -0.18312497437000275, -0.17231129109859467, -0.16149762272834778, -0.1506839394569397, -0.13987025618553162, -0.12905657291412354, -0.11824288964271545, -0.10742920637130737, -0.09661552309989929, -0.08580183982849121, -0.07498816400766373, -0.06417448073625565, -0.05336079001426697, -0.04254710674285889, -0.031733423471450806, -0.020919743925333023, -0.010106060653924942, 0.000707622617483139, 0.011521302163600922, 0.022334985435009003, 0.033148668706417084, 0.043962351977825165, 0.054776035249233246, 0.06558971107006073, 0.07640339434146881, 0.08721707761287689, 0.09803076088428497, 0.10884444415569305, 0.11965812742710114]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 8.0, 7.0, 10.0, 15.0, 13.0, 17.0, 28.0, 29.0, 31.0, 35.0, 35.0, 52.0, 42.0, 53.0, 48.0, 45.0, 53.0, 54.0, 47.0, 46.0, 36.0, 40.0, 37.0, 29.0, 33.0, 27.0, 17.0, 20.0, 23.0, 12.0, 13.0, 18.0, 6.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10895055532455444, -0.10589355230331421, -0.10283655673265457, -0.09977956116199493, -0.0967225581407547, -0.09366555511951447, -0.09060855954885483, -0.08755156397819519, -0.08449456095695496, -0.08143755793571472, -0.07838056236505508, -0.07532356679439545, -0.07226656377315521, -0.06920956075191498, -0.06615256518125534, -0.0630955696105957, -0.06003856658935547, -0.05698156729340553, -0.0539245679974556, -0.05086756870150566, -0.047810569405555725, -0.04475357010960579, -0.04169657081365585, -0.03863957151770592, -0.03558257222175598, -0.032525572925806046, -0.02946857362985611, -0.026411574333906174, -0.023354575037956238, -0.020297575742006302, -0.017240576446056366, -0.01418357715010643, -0.011126577854156494, -0.008069578558206558, -0.005012579262256622, -0.0019555799663066864, 0.0011014193296432495, 0.004158418625593185, 0.007215417921543121, 0.010272417217493057, 0.013329416513442993, 0.01638641580939293, 0.019443415105342865, 0.0225004144012928, 0.025557413697242737, 0.028614412993192673, 0.03167141228914261, 0.034728411585092545, 0.03778541088104248, 0.040842410176992416, 0.04389940947294235, 0.04695640876889229, 0.050013408064842224, 0.05307040736079216, 0.056127406656742096, 0.05918440595269203, 0.06224140524864197, 0.0652984082698822, 0.06835540384054184, 0.07141239941120148, 0.07446940243244171, 0.07752640545368195, 0.08058340102434158, 0.08364039659500122, 0.08669739961624146]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 6.0, 8.0, 8.0, 13.0, 19.0, 22.0, 35.0, 57.0, 68.0, 97.0, 164.0, 250.0, 334.0, 589.0, 1053.0, 2190.0, 5253.0, 15749.0, 53014.0, 188964.0, 439203.0, 240334.0, 69122.0, 20027.0, 6500.0, 2490.0, 1197.0, 659.0, 363.0, 234.0, 160.0, 110.0, 79.0, 59.0, 34.0, 24.0, 28.0, 10.0, 16.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061187744140625, -0.05912065505981445, -0.057053565979003906, -0.05498647689819336, -0.05291938781738281, -0.050852298736572266, -0.04878520965576172, -0.04671812057495117, -0.044651031494140625, -0.04258394241333008, -0.04051685333251953, -0.038449764251708984, -0.03638267517089844, -0.03431558609008789, -0.032248497009277344, -0.030181407928466797, -0.02811431884765625, -0.026047229766845703, -0.023980140686035156, -0.02191305160522461, -0.019845962524414062, -0.017778873443603516, -0.01571178436279297, -0.013644695281982422, -0.011577606201171875, -0.009510517120361328, -0.007443428039550781, -0.005376338958740234, -0.0033092498779296875, -0.0012421607971191406, 0.0008249282836914062, 0.002892017364501953, 0.0049591064453125, 0.007026195526123047, 0.009093284606933594, 0.01116037368774414, 0.013227462768554688, 0.015294551849365234, 0.01736164093017578, 0.019428730010986328, 0.021495819091796875, 0.023562908172607422, 0.02562999725341797, 0.027697086334228516, 0.029764175415039062, 0.03183126449584961, 0.033898353576660156, 0.0359654426574707, 0.03803253173828125, 0.0400996208190918, 0.042166709899902344, 0.04423379898071289, 0.04630088806152344, 0.048367977142333984, 0.05043506622314453, 0.05250215530395508, 0.054569244384765625, 0.05663633346557617, 0.05870342254638672, 0.060770511627197266, 0.06283760070800781, 0.06490468978881836, 0.0669717788696289, 0.06903886795043945, 0.07110595703125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 11.0, 19.0, 32.0, 44.0, 58.0, 82.0, 90.0, 114.0, 118.0, 107.0, 95.0, 75.0, 73.0, 35.0, 18.0, 10.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09564208984375, -0.09293556213378906, -0.09022903442382812, -0.08752250671386719, -0.08481597900390625, -0.08210945129394531, -0.07940292358398438, -0.07669639587402344, -0.0739898681640625, -0.07128334045410156, -0.06857681274414062, -0.06587028503417969, -0.06316375732421875, -0.06045722961425781, -0.057750701904296875, -0.05504417419433594, -0.052337646484375, -0.04963111877441406, -0.046924591064453125, -0.04421806335449219, -0.04151153564453125, -0.03880500793457031, -0.036098480224609375, -0.03339195251464844, -0.0306854248046875, -0.027978897094726562, -0.025272369384765625, -0.022565841674804688, -0.01985931396484375, -0.017152786254882812, -0.014446258544921875, -0.011739730834960938, -0.009033203125, -0.0063266754150390625, -0.003620147705078125, -0.0009136199951171875, 0.00179290771484375, 0.0044994354248046875, 0.007205963134765625, 0.009912490844726562, 0.0126190185546875, 0.015325546264648438, 0.018032073974609375, 0.020738601684570312, 0.02344512939453125, 0.026151657104492188, 0.028858184814453125, 0.03156471252441406, 0.034271240234375, 0.03697776794433594, 0.039684295654296875, 0.04239082336425781, 0.04509735107421875, 0.04780387878417969, 0.050510406494140625, 0.05321693420410156, 0.0559234619140625, 0.05862998962402344, 0.061336517333984375, 0.06404304504394531, 0.06674957275390625, 0.06945610046386719, 0.07216262817382812, 0.07486915588378906, 0.07757568359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 6.0, 12.0, 19.0, 8.0, 16.0, 13.0, 23.0, 19.0, 20.0, 29.0, 39.0, 49.0, 86.0, 144.0, 321.0, 1016.0, 3907.0, 20769.0, 144657.0, 601424.0, 234116.0, 33809.0, 5758.0, 1338.0, 416.0, 165.0, 91.0, 50.0, 38.0, 21.0, 19.0, 13.0, 21.0, 26.0, 13.0, 13.0, 10.0, 14.0, 7.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0858154296875, -0.08318519592285156, -0.08055496215820312, -0.07792472839355469, -0.07529449462890625, -0.07266426086425781, -0.07003402709960938, -0.06740379333496094, -0.0647735595703125, -0.06214332580566406, -0.059513092041015625, -0.05688285827636719, -0.05425262451171875, -0.05162239074707031, -0.048992156982421875, -0.04636192321777344, -0.043731689453125, -0.04110145568847656, -0.038471221923828125, -0.03584098815917969, -0.03321075439453125, -0.030580520629882812, -0.027950286865234375, -0.025320053100585938, -0.0226898193359375, -0.020059585571289062, -0.017429351806640625, -0.014799118041992188, -0.01216888427734375, -0.009538650512695312, -0.006908416748046875, -0.0042781829833984375, -0.00164794921875, 0.0009822845458984375, 0.003612518310546875, 0.0062427520751953125, 0.00887298583984375, 0.011503219604492188, 0.014133453369140625, 0.016763687133789062, 0.0193939208984375, 0.022024154663085938, 0.024654388427734375, 0.027284622192382812, 0.02991485595703125, 0.03254508972167969, 0.035175323486328125, 0.03780555725097656, 0.040435791015625, 0.04306602478027344, 0.045696258544921875, 0.04832649230957031, 0.05095672607421875, 0.05358695983886719, 0.056217193603515625, 0.05884742736816406, 0.0614776611328125, 0.06410789489746094, 0.06673812866210938, 0.06936836242675781, 0.07199859619140625, 0.07462882995605469, 0.07725906372070312, 0.07988929748535156, 0.08251953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 3.0, 7.0, 5.0, 8.0, 9.0, 10.0, 11.0, 16.0, 22.0, 18.0, 25.0, 19.0, 17.0, 18.0, 21.0, 34.0, 45.0, 27.0, 32.0, 42.0, 37.0, 42.0, 31.0, 49.0, 31.0, 53.0, 33.0, 42.0, 28.0, 35.0, 29.0, 29.0, 21.0, 13.0, 26.0, 22.0, 16.0, 14.0, 13.0, 11.0, 12.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0665283203125, -0.06438732147216797, -0.06224632263183594, -0.060105323791503906, -0.057964324951171875, -0.055823326110839844, -0.05368232727050781, -0.05154132843017578, -0.04940032958984375, -0.04725933074951172, -0.04511833190917969, -0.042977333068847656, -0.040836334228515625, -0.038695335388183594, -0.03655433654785156, -0.03441333770751953, -0.0322723388671875, -0.03013134002685547, -0.027990341186523438, -0.025849342346191406, -0.023708343505859375, -0.021567344665527344, -0.019426345825195312, -0.01728534698486328, -0.01514434814453125, -0.013003349304199219, -0.010862350463867188, -0.008721351623535156, -0.006580352783203125, -0.004439353942871094, -0.0022983551025390625, -0.00015735626220703125, 0.001983642578125, 0.004124641418457031, 0.0062656402587890625, 0.008406639099121094, 0.010547637939453125, 0.012688636779785156, 0.014829635620117188, 0.01697063446044922, 0.01911163330078125, 0.02125263214111328, 0.023393630981445312, 0.025534629821777344, 0.027675628662109375, 0.029816627502441406, 0.03195762634277344, 0.03409862518310547, 0.0362396240234375, 0.03838062286376953, 0.04052162170410156, 0.042662620544433594, 0.044803619384765625, 0.046944618225097656, 0.04908561706542969, 0.05122661590576172, 0.05336761474609375, 0.05550861358642578, 0.05764961242675781, 0.059790611267089844, 0.061931610107421875, 0.0640726089477539, 0.06621360778808594, 0.06835460662841797, 0.07049560546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 4.0, 8.0, 10.0, 9.0, 14.0, 14.0, 18.0, 50.0, 48.0, 70.0, 106.0, 163.0, 233.0, 320.0, 473.0, 687.0, 1023.0, 1573.0, 2518.0, 4139.0, 7175.0, 13186.0, 24946.0, 50630.0, 114269.0, 244149.0, 288670.0, 154662.0, 67782.0, 32174.0, 16628.0, 9065.0, 5127.0, 3037.0, 1880.0, 1182.0, 773.0, 523.0, 351.0, 238.0, 172.0, 113.0, 87.0, 82.0, 52.0, 35.0, 30.0, 19.0, 13.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0116424560546875, -0.01129162311553955, -0.010940790176391602, -0.010589957237243652, -0.010239124298095703, -0.009888291358947754, -0.009537458419799805, -0.009186625480651855, -0.008835792541503906, -0.008484959602355957, -0.008134126663208008, -0.007783293724060059, -0.007432460784912109, -0.00708162784576416, -0.006730794906616211, -0.006379961967468262, -0.0060291290283203125, -0.005678296089172363, -0.005327463150024414, -0.004976630210876465, -0.004625797271728516, -0.004274964332580566, -0.003924131393432617, -0.003573298454284668, -0.0032224655151367188, -0.0028716325759887695, -0.0025207996368408203, -0.002169966697692871, -0.0018191337585449219, -0.0014683008193969727, -0.0011174678802490234, -0.0007666349411010742, -0.000415802001953125, -6.496906280517578e-05, 0.00028586387634277344, 0.0006366968154907227, 0.0009875297546386719, 0.001338362693786621, 0.0016891956329345703, 0.0020400285720825195, 0.0023908615112304688, 0.002741694450378418, 0.003092527389526367, 0.0034433603286743164, 0.0037941932678222656, 0.004145026206970215, 0.004495859146118164, 0.004846692085266113, 0.0051975250244140625, 0.005548357963562012, 0.005899190902709961, 0.00625002384185791, 0.006600856781005859, 0.006951689720153809, 0.007302522659301758, 0.007653355598449707, 0.008004188537597656, 0.008355021476745605, 0.008705854415893555, 0.009056687355041504, 0.009407520294189453, 0.009758353233337402, 0.010109186172485352, 0.0104600191116333, 0.01081085205078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 10.0, 9.0, 22.0, 21.0, 20.0, 28.0, 24.0, 44.0, 42.0, 38.0, 59.0, 56.0, 66.0, 50.0, 55.0, 64.0, 43.0, 56.0, 44.0, 40.0, 23.0, 25.0, 34.0, 13.0, 22.0, 14.0, 10.0, 14.0, 8.0, 12.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.258487701416016e-06, -6.055459380149841e-06, -5.852431058883667e-06, -5.649402737617493e-06, -5.446374416351318e-06, -5.243346095085144e-06, -5.04031777381897e-06, -4.837289452552795e-06, -4.634261131286621e-06, -4.431232810020447e-06, -4.2282044887542725e-06, -4.025176167488098e-06, -3.822147846221924e-06, -3.6191195249557495e-06, -3.416091203689575e-06, -3.213062882423401e-06, -3.0100345611572266e-06, -2.8070062398910522e-06, -2.603977918624878e-06, -2.4009495973587036e-06, -2.1979212760925293e-06, -1.994892954826355e-06, -1.7918646335601807e-06, -1.5888363122940063e-06, -1.385807991027832e-06, -1.1827796697616577e-06, -9.797513484954834e-07, -7.767230272293091e-07, -5.736947059631348e-07, -3.7066638469696045e-07, -1.6763806343078613e-07, 3.5390257835388184e-08, 2.384185791015625e-07, 4.414469003677368e-07, 6.444752216339111e-07, 8.475035429000854e-07, 1.0505318641662598e-06, 1.253560185432434e-06, 1.4565885066986084e-06, 1.6596168279647827e-06, 1.862645149230957e-06, 2.0656734704971313e-06, 2.2687017917633057e-06, 2.47173011302948e-06, 2.6747584342956543e-06, 2.8777867555618286e-06, 3.080815076828003e-06, 3.2838433980941772e-06, 3.4868717193603516e-06, 3.689900040626526e-06, 3.8929283618927e-06, 4.0959566831588745e-06, 4.298985004425049e-06, 4.502013325691223e-06, 4.7050416469573975e-06, 4.908069968223572e-06, 5.111098289489746e-06, 5.31412661075592e-06, 5.517154932022095e-06, 5.720183253288269e-06, 5.923211574554443e-06, 6.126239895820618e-06, 6.329268217086792e-06, 6.532296538352966e-06, 6.735324859619141e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 6.0, 9.0, 24.0, 27.0, 35.0, 68.0, 93.0, 137.0, 192.0, 278.0, 470.0, 827.0, 1474.0, 2912.0, 6262.0, 14774.0, 39082.0, 122641.0, 369659.0, 328365.0, 102909.0, 33920.0, 12871.0, 5519.0, 2579.0, 1374.0, 767.0, 433.0, 294.0, 153.0, 131.0, 87.0, 54.0, 42.0, 20.0, 22.0, 9.0, 11.0, 5.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0188140869140625, -0.018259525299072266, -0.01770496368408203, -0.017150402069091797, -0.016595840454101562, -0.016041278839111328, -0.015486717224121094, -0.01493215560913086, -0.014377593994140625, -0.01382303237915039, -0.013268470764160156, -0.012713909149169922, -0.012159347534179688, -0.011604785919189453, -0.011050224304199219, -0.010495662689208984, -0.00994110107421875, -0.009386539459228516, -0.008831977844238281, -0.008277416229248047, -0.0077228546142578125, -0.007168292999267578, -0.006613731384277344, -0.006059169769287109, -0.005504608154296875, -0.004950046539306641, -0.004395484924316406, -0.003840923309326172, -0.0032863616943359375, -0.002731800079345703, -0.0021772384643554688, -0.0016226768493652344, -0.001068115234375, -0.0005135536193847656, 4.100799560546875e-05, 0.0005955696105957031, 0.0011501312255859375, 0.0017046928405761719, 0.0022592544555664062, 0.0028138160705566406, 0.003368377685546875, 0.003922939300537109, 0.004477500915527344, 0.005032062530517578, 0.0055866241455078125, 0.006141185760498047, 0.006695747375488281, 0.007250308990478516, 0.00780487060546875, 0.008359432220458984, 0.008913993835449219, 0.009468555450439453, 0.010023117065429688, 0.010577678680419922, 0.011132240295410156, 0.01168680191040039, 0.012241363525390625, 0.01279592514038086, 0.013350486755371094, 0.013905048370361328, 0.014459609985351562, 0.015014171600341797, 0.015568733215332031, 0.016123294830322266, 0.0166778564453125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 9.0, 7.0, 9.0, 13.0, 9.0, 9.0, 18.0, 20.0, 32.0, 35.0, 43.0, 53.0, 80.0, 89.0, 69.0, 71.0, 83.0, 71.0, 56.0, 52.0, 37.0, 26.0, 16.0, 21.0, 18.0, 13.0, 10.0, 5.0, 3.0, 6.0, 4.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0137176513671875, -0.013248920440673828, -0.012780189514160156, -0.012311458587646484, -0.011842727661132812, -0.01137399673461914, -0.010905265808105469, -0.010436534881591797, -0.009967803955078125, -0.009499073028564453, -0.009030342102050781, -0.00856161117553711, -0.008092880249023438, -0.007624149322509766, -0.007155418395996094, -0.006686687469482422, -0.00621795654296875, -0.005749225616455078, -0.005280494689941406, -0.004811763763427734, -0.0043430328369140625, -0.0038743019104003906, -0.0034055709838867188, -0.002936840057373047, -0.002468109130859375, -0.001999378204345703, -0.0015306472778320312, -0.0010619163513183594, -0.0005931854248046875, -0.00012445449829101562, 0.00034427642822265625, 0.0008130073547363281, 0.00128173828125, 0.0017504692077636719, 0.0022192001342773438, 0.0026879310607910156, 0.0031566619873046875, 0.0036253929138183594, 0.004094123840332031, 0.004562854766845703, 0.005031585693359375, 0.005500316619873047, 0.005969047546386719, 0.006437778472900391, 0.0069065093994140625, 0.007375240325927734, 0.007843971252441406, 0.008312702178955078, 0.00878143310546875, 0.009250164031982422, 0.009718894958496094, 0.010187625885009766, 0.010656356811523438, 0.01112508773803711, 0.011593818664550781, 0.012062549591064453, 0.012531280517578125, 0.013000011444091797, 0.013468742370605469, 0.01393747329711914, 0.014406204223632812, 0.014874935150146484, 0.015343666076660156, 0.015812397003173828, 0.0162811279296875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 14.0, 56.0, 225.0, 388.0, 226.0, 69.0, 28.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1836555004119873, -0.16432428359985352, -0.14499308168888092, -0.12566187977790833, -0.10633066296577454, -0.08699945360422134, -0.06766824424266815, -0.04833704233169556, -0.029005825519561768, -0.009674616158008575, 0.009656593203544617, 0.02898780256509781, 0.048319011926651, 0.0676502212882042, 0.08698143064975739, 0.10631263256072998, 0.12564384937286377, 0.14497506618499756, 0.16430626809597015, 0.18363747000694275, 0.20296868681907654, 0.22229990363121033, 0.24163110554218292, 0.2609623074531555, 0.2802935242652893, 0.2996247410774231, 0.3189559578895569, 0.3382871448993683, 0.3576183617115021, 0.37694957852363586, 0.39628076553344727, 0.41561198234558105, 0.43494319915771484, 0.45427441596984863, 0.4736056327819824, 0.4929368197917938, 0.51226806640625, 0.531599223613739, 0.5509304404258728, 0.5702616572380066, 0.5895928740501404, 0.6089240908622742, 0.628255307674408, 0.6475865244865417, 0.6669176816940308, 0.6862488985061646, 0.7055801153182983, 0.7249113321304321, 0.7442425489425659, 0.7635737657546997, 0.7829049825668335, 0.8022361993789673, 0.8215674161911011, 0.8408985733985901, 0.8602297902107239, 0.8795610070228577, 0.8988922238349915, 0.9182234406471252, 0.937554657459259, 0.9568858742713928, 0.9762170314788818, 0.9955482482910156, 1.0148794651031494, 1.0342106819152832, 1.053541898727417]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 6.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 6.0, 11.0, 20.0, 15.0, 20.0, 29.0, 27.0, 31.0, 31.0, 32.0, 30.0, 44.0, 31.0, 39.0, 41.0, 45.0, 37.0, 29.0, 47.0, 41.0, 30.0, 42.0, 38.0, 21.0, 39.0, 24.0, 17.0, 26.0, 16.0, 19.0, 20.0, 9.0, 11.0, 17.0, 9.0, 5.0, 5.0, 8.0, 1.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.1948336362838745, -0.1891840249300003, -0.1835343986749649, -0.1778847873210907, -0.1722351610660553, -0.1665855497121811, -0.16093593835830688, -0.15528631210327148, -0.14963668584823608, -0.14398707449436188, -0.13833744823932648, -0.13268783688545227, -0.12703821063041687, -0.12138859927654266, -0.11573898047208786, -0.11008936166763306, -0.10443975031375885, -0.09879013150930405, -0.09314051270484924, -0.08749090135097504, -0.08184127509593964, -0.07619166374206543, -0.07054204493761063, -0.06489242613315582, -0.05924280732870102, -0.053593188524246216, -0.04794356971979141, -0.04229395464062691, -0.036644335836172104, -0.0309947170317173, -0.025345101952552795, -0.019695483148097992, -0.014045864343643188, -0.00839624647051096, -0.0027466285973787308, 0.0029029883444309235, 0.008552607148885727, 0.01420222595334053, 0.019851841032505035, 0.02550145983695984, 0.031151078641414642, 0.036800697445869446, 0.04245031625032425, 0.048099931329488754, 0.05374955013394356, 0.05939916893839836, 0.06504878401756287, 0.07069840282201767, 0.07634802162647247, 0.08199764043092728, 0.08764725923538208, 0.09329687058925629, 0.09894649684429169, 0.1045961081981659, 0.1102457270026207, 0.1158953458070755, 0.1215449646115303, 0.1271945834159851, 0.13284419476985931, 0.13849382102489471, 0.14414343237876892, 0.14979305863380432, 0.15544266998767853, 0.16109228134155273, 0.16674190759658813]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 8.0, 6.0, 13.0, 19.0, 19.0, 27.0, 36.0, 55.0, 60.0, 104.0, 99.0, 185.0, 334.0, 520.0, 1028.0, 1885.0, 4033.0, 10057.0, 39057.0, 250203.0, 2357748.0, 1330622.0, 154544.0, 27868.0, 8432.0, 3566.0, 1693.0, 910.0, 498.0, 261.0, 131.0, 83.0, 42.0, 37.0, 36.0, 21.0, 12.0, 9.0, 6.0, 4.0, 4.0, 3.0, 5.0, 4.0, 2.0], "bins": [-0.05963134765625, -0.058135986328125, -0.056640625, -0.055145263671875, -0.05364990234375, -0.052154541015625, -0.0506591796875, -0.049163818359375, -0.04766845703125, -0.046173095703125, -0.044677734375, -0.043182373046875, -0.04168701171875, -0.040191650390625, -0.0386962890625, -0.037200927734375, -0.03570556640625, -0.034210205078125, -0.03271484375, -0.031219482421875, -0.02972412109375, -0.028228759765625, -0.0267333984375, -0.025238037109375, -0.02374267578125, -0.022247314453125, -0.020751953125, -0.019256591796875, -0.01776123046875, -0.016265869140625, -0.0147705078125, -0.013275146484375, -0.01177978515625, -0.010284423828125, -0.0087890625, -0.007293701171875, -0.00579833984375, -0.004302978515625, -0.0028076171875, -0.001312255859375, 0.00018310546875, 0.001678466796875, 0.003173828125, 0.004669189453125, 0.00616455078125, 0.007659912109375, 0.0091552734375, 0.010650634765625, 0.01214599609375, 0.013641357421875, 0.01513671875, 0.016632080078125, 0.01812744140625, 0.019622802734375, 0.0211181640625, 0.022613525390625, 0.02410888671875, 0.025604248046875, 0.027099609375, 0.028594970703125, 0.03009033203125, 0.031585693359375, 0.0330810546875, 0.034576416015625, 0.03607177734375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 12.0, 22.0, 33.0, 45.0, 71.0, 85.0, 106.0, 128.0, 130.0, 107.0, 87.0, 59.0, 39.0, 37.0, 20.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09523487091064453, -0.09250831604003906, -0.0897817611694336, -0.08705520629882812, -0.08432865142822266, -0.08160209655761719, -0.07887554168701172, -0.07614898681640625, -0.07342243194580078, -0.07069587707519531, -0.06796932220458984, -0.06524276733398438, -0.0625162124633789, -0.05978965759277344, -0.05706310272216797, -0.0543365478515625, -0.05160999298095703, -0.04888343811035156, -0.046156883239746094, -0.043430328369140625, -0.040703773498535156, -0.03797721862792969, -0.03525066375732422, -0.03252410888671875, -0.02979755401611328, -0.027070999145507812, -0.024344444274902344, -0.021617889404296875, -0.018891334533691406, -0.016164779663085938, -0.013438224792480469, -0.010711669921875, -0.007985115051269531, -0.0052585601806640625, -0.0025320053100585938, 0.000194549560546875, 0.0029211044311523438, 0.0056476593017578125, 0.008374214172363281, 0.01110076904296875, 0.013827323913574219, 0.016553878784179688, 0.019280433654785156, 0.022006988525390625, 0.024733543395996094, 0.027460098266601562, 0.03018665313720703, 0.0329132080078125, 0.03563976287841797, 0.03836631774902344, 0.041092872619628906, 0.043819427490234375, 0.046545982360839844, 0.04927253723144531, 0.05199909210205078, 0.05472564697265625, 0.05745220184326172, 0.06017875671386719, 0.06290531158447266, 0.06563186645507812, 0.0683584213256836, 0.07108497619628906, 0.07381153106689453, 0.0765380859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 9.0, 8.0, 9.0, 29.0, 53.0, 72.0, 135.0, 280.0, 473.0, 920.0, 1696.0, 3536.0, 7874.0, 18428.0, 48201.0, 164174.0, 891894.0, 2410842.0, 480249.0, 105271.0, 34600.0, 13613.0, 5975.0, 2797.0, 1426.0, 801.0, 400.0, 234.0, 121.0, 75.0, 44.0, 24.0, 13.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.044219970703125, -0.04315018653869629, -0.04208040237426758, -0.04101061820983887, -0.039940834045410156, -0.038871049880981445, -0.037801265716552734, -0.03673148155212402, -0.03566169738769531, -0.0345919132232666, -0.03352212905883789, -0.03245234489440918, -0.03138256072998047, -0.030312776565551758, -0.029242992401123047, -0.028173208236694336, -0.027103424072265625, -0.026033639907836914, -0.024963855743408203, -0.023894071578979492, -0.02282428741455078, -0.02175450325012207, -0.02068471908569336, -0.01961493492126465, -0.018545150756835938, -0.017475366592407227, -0.016405582427978516, -0.015335798263549805, -0.014266014099121094, -0.013196229934692383, -0.012126445770263672, -0.011056661605834961, -0.00998687744140625, -0.008917093276977539, -0.007847309112548828, -0.006777524948120117, -0.005707740783691406, -0.004637956619262695, -0.0035681724548339844, -0.0024983882904052734, -0.0014286041259765625, -0.00035881996154785156, 0.0007109642028808594, 0.0017807483673095703, 0.0028505325317382812, 0.003920316696166992, 0.004990100860595703, 0.006059885025024414, 0.007129669189453125, 0.008199453353881836, 0.009269237518310547, 0.010339021682739258, 0.011408805847167969, 0.01247859001159668, 0.01354837417602539, 0.014618158340454102, 0.015687942504882812, 0.016757726669311523, 0.017827510833740234, 0.018897294998168945, 0.019967079162597656, 0.021036863327026367, 0.022106647491455078, 0.02317643165588379, 0.0242462158203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 6.0, 5.0, 6.0, 5.0, 8.0, 5.0, 12.0, 17.0, 15.0, 36.0, 44.0, 44.0, 69.0, 129.0, 187.0, 263.0, 406.0, 574.0, 673.0, 467.0, 339.0, 264.0, 136.0, 112.0, 62.0, 48.0, 22.0, 30.0, 23.0, 16.0, 18.0, 5.0, 9.0, 4.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0223541259765625, -0.021533489227294922, -0.020712852478027344, -0.019892215728759766, -0.019071578979492188, -0.01825094223022461, -0.01743030548095703, -0.016609668731689453, -0.015789031982421875, -0.014968395233154297, -0.014147758483886719, -0.01332712173461914, -0.012506484985351562, -0.011685848236083984, -0.010865211486816406, -0.010044574737548828, -0.00922393798828125, -0.008403301239013672, -0.007582664489746094, -0.006762027740478516, -0.0059413909912109375, -0.005120754241943359, -0.004300117492675781, -0.003479480743408203, -0.002658843994140625, -0.0018382072448730469, -0.0010175704956054688, -0.00019693374633789062, 0.0006237030029296875, 0.0014443397521972656, 0.0022649765014648438, 0.003085613250732422, 0.00390625, 0.004726886749267578, 0.005547523498535156, 0.006368160247802734, 0.0071887969970703125, 0.00800943374633789, 0.008830070495605469, 0.009650707244873047, 0.010471343994140625, 0.011291980743408203, 0.012112617492675781, 0.01293325424194336, 0.013753890991210938, 0.014574527740478516, 0.015395164489746094, 0.016215801239013672, 0.01703643798828125, 0.017857074737548828, 0.018677711486816406, 0.019498348236083984, 0.020318984985351562, 0.02113962173461914, 0.02196025848388672, 0.022780895233154297, 0.023601531982421875, 0.024422168731689453, 0.02524280548095703, 0.02606344223022461, 0.026884078979492188, 0.027704715728759766, 0.028525352478027344, 0.029345989227294922, 0.0301666259765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 11.0, 19.0, 22.0, 45.0, 62.0, 91.0, 83.0, 111.0, 116.0, 104.0, 108.0, 78.0, 50.0, 36.0, 21.0, 15.0, 6.0, 7.0, 7.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08133012056350708, -0.077098049223423, -0.07286597788333893, -0.06863391399383545, -0.06440184265375137, -0.0601697713136673, -0.05593770369887352, -0.05170563608407974, -0.047473564743995667, -0.04324149340391159, -0.03900942578911781, -0.034777358174324036, -0.03054528683423996, -0.026313217356801033, -0.022081147879362106, -0.01784907840192318, -0.013617008924484253, -0.009384939447045326, -0.0051528699696063995, -0.0009208004921674728, 0.003311268985271454, 0.0075433384627103806, 0.011775407940149307, 0.016007477417588234, 0.02023954689502716, 0.024471616372466087, 0.028703685849905014, 0.03293575346469879, 0.03716782480478287, 0.04139989614486694, 0.04563196375966072, 0.0498640313744545, 0.054096102714538574, 0.05832817405462265, 0.06256024539470673, 0.0667923092842102, 0.07102438062429428, 0.07525645196437836, 0.07948851585388184, 0.08372058719396591, 0.08795265853404999, 0.09218472987413406, 0.09641680121421814, 0.10064886510372162, 0.1048809364438057, 0.10911300778388977, 0.11334507167339325, 0.11757714301347733, 0.1218092143535614, 0.12604127824306488, 0.13027335703372955, 0.13450542092323303, 0.1387374997138977, 0.14296956360340118, 0.14720162749290466, 0.15143370628356934, 0.15566577017307281, 0.1598978340625763, 0.16412991285324097, 0.16836197674274445, 0.17259404063224792, 0.1768261194229126, 0.18105818331241608, 0.18529026210308075, 0.18952232599258423]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 4.0, 0.0, 2.0, 9.0, 10.0, 5.0, 21.0, 13.0, 17.0, 17.0, 18.0, 32.0, 27.0, 31.0, 23.0, 38.0, 32.0, 37.0, 46.0, 41.0, 48.0, 42.0, 34.0, 35.0, 35.0, 40.0, 36.0, 44.0, 35.0, 25.0, 32.0, 27.0, 25.0, 24.0, 18.0, 16.0, 9.0, 8.0, 13.0, 4.0, 7.0, 5.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06265407800674438, -0.06050029397010803, -0.05834650993347168, -0.056192729622125626, -0.05403894558548927, -0.05188516154885292, -0.049731381237506866, -0.047577597200870514, -0.04542381316423416, -0.04327002912759781, -0.041116245090961456, -0.0389624647796154, -0.03680868074297905, -0.0346548967063427, -0.03250111639499664, -0.03034733235836029, -0.028193548321723938, -0.026039764285087585, -0.023885982111096382, -0.02173219993710518, -0.019578415900468826, -0.017424631863832474, -0.01527084968984127, -0.013117066584527493, -0.010963283479213715, -0.008809500373899937, -0.006655717268586159, -0.004501934163272381, -0.002348151057958603, -0.00019436795264482498, 0.001959415152668953, 0.004113198257982731, 0.006266981363296509, 0.008420764468610287, 0.010574547573924065, 0.012728330679237843, 0.01488211378455162, 0.017035897821187973, 0.019189679995179176, 0.02134346216917038, 0.023497246205806732, 0.025651030242443085, 0.027804812416434288, 0.02995859459042549, 0.032112378627061844, 0.034266162663698196, 0.03641994297504425, 0.0385737270116806, 0.040727511048316956, 0.04288129508495331, 0.04503507912158966, 0.047188859432935715, 0.04934264346957207, 0.05149642750620842, 0.053650207817554474, 0.055803991854190826, 0.05795777589082718, 0.06011155992746353, 0.062265343964099884, 0.06441912800073624, 0.06657290458679199, 0.06872668862342834, 0.0708804726600647, 0.07303425669670105, 0.0751880407333374]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 12.0, 16.0, 22.0, 23.0, 37.0, 54.0, 74.0, 123.0, 138.0, 222.0, 323.0, 529.0, 1080.0, 2224.0, 5572.0, 16151.0, 53176.0, 189970.0, 434993.0, 241241.0, 69428.0, 20564.0, 6904.0, 2698.0, 1168.0, 607.0, 371.0, 269.0, 154.0, 127.0, 61.0, 60.0, 50.0, 29.0, 25.0, 15.0, 9.0, 6.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05352783203125, -0.05171966552734375, -0.0499114990234375, -0.04810333251953125, -0.046295166015625, -0.04448699951171875, -0.0426788330078125, -0.04087066650390625, -0.0390625, -0.03725433349609375, -0.0354461669921875, -0.03363800048828125, -0.031829833984375, -0.03002166748046875, -0.0282135009765625, -0.02640533447265625, -0.02459716796875, -0.02278900146484375, -0.0209808349609375, -0.01917266845703125, -0.017364501953125, -0.01555633544921875, -0.0137481689453125, -0.01194000244140625, -0.0101318359375, -0.00832366943359375, -0.0065155029296875, -0.00470733642578125, -0.002899169921875, -0.00109100341796875, 0.0007171630859375, 0.00252532958984375, 0.00433349609375, 0.00614166259765625, 0.0079498291015625, 0.00975799560546875, 0.011566162109375, 0.01337432861328125, 0.0151824951171875, 0.01699066162109375, 0.018798828125, 0.02060699462890625, 0.0224151611328125, 0.02422332763671875, 0.026031494140625, 0.02783966064453125, 0.0296478271484375, 0.03145599365234375, 0.03326416015625, 0.03507232666015625, 0.0368804931640625, 0.03868865966796875, 0.040496826171875, 0.04230499267578125, 0.0441131591796875, 0.04592132568359375, 0.0477294921875, 0.04953765869140625, 0.0513458251953125, 0.05315399169921875, 0.054962158203125, 0.05677032470703125, 0.0585784912109375, 0.06038665771484375, 0.06219482421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 10.0, 19.0, 25.0, 35.0, 57.0, 97.0, 90.0, 117.0, 123.0, 112.0, 91.0, 78.0, 63.0, 28.0, 26.0, 11.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09174823760986328, -0.08907508850097656, -0.08640193939208984, -0.08372879028320312, -0.0810556411743164, -0.07838249206542969, -0.07570934295654297, -0.07303619384765625, -0.07036304473876953, -0.06768989562988281, -0.0650167465209961, -0.062343597412109375, -0.059670448303222656, -0.05699729919433594, -0.05432415008544922, -0.0516510009765625, -0.04897785186767578, -0.04630470275878906, -0.043631553649902344, -0.040958404541015625, -0.038285255432128906, -0.03561210632324219, -0.03293895721435547, -0.03026580810546875, -0.02759265899658203, -0.024919509887695312, -0.022246360778808594, -0.019573211669921875, -0.016900062561035156, -0.014226913452148438, -0.011553764343261719, -0.008880615234375, -0.006207466125488281, -0.0035343170166015625, -0.0008611679077148438, 0.001811981201171875, 0.004485130310058594, 0.0071582794189453125, 0.009831428527832031, 0.01250457763671875, 0.015177726745605469, 0.017850875854492188, 0.020524024963378906, 0.023197174072265625, 0.025870323181152344, 0.028543472290039062, 0.03121662139892578, 0.0338897705078125, 0.03656291961669922, 0.03923606872558594, 0.041909217834472656, 0.044582366943359375, 0.047255516052246094, 0.04992866516113281, 0.05260181427001953, 0.05527496337890625, 0.05794811248779297, 0.06062126159667969, 0.0632944107055664, 0.06596755981445312, 0.06864070892333984, 0.07131385803222656, 0.07398700714111328, 0.07666015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 4.0, 7.0, 11.0, 7.0, 16.0, 6.0, 22.0, 22.0, 24.0, 28.0, 20.0, 37.0, 61.0, 75.0, 169.0, 570.0, 2604.0, 17957.0, 163678.0, 671110.0, 169820.0, 18459.0, 2728.0, 570.0, 187.0, 81.0, 52.0, 36.0, 15.0, 33.0, 27.0, 28.0, 17.0, 7.0, 6.0, 10.0, 12.0, 7.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08355712890625, -0.08081817626953125, -0.0780792236328125, -0.07534027099609375, -0.072601318359375, -0.06986236572265625, -0.0671234130859375, -0.06438446044921875, -0.0616455078125, -0.05890655517578125, -0.0561676025390625, -0.05342864990234375, -0.050689697265625, -0.04795074462890625, -0.0452117919921875, -0.04247283935546875, -0.03973388671875, -0.03699493408203125, -0.0342559814453125, -0.03151702880859375, -0.028778076171875, -0.02603912353515625, -0.0233001708984375, -0.02056121826171875, -0.017822265625, -0.01508331298828125, -0.0123443603515625, -0.00960540771484375, -0.006866455078125, -0.00412750244140625, -0.0013885498046875, 0.00135040283203125, 0.00408935546875, 0.00682830810546875, 0.0095672607421875, 0.01230621337890625, 0.015045166015625, 0.01778411865234375, 0.0205230712890625, 0.02326202392578125, 0.0260009765625, 0.02873992919921875, 0.0314788818359375, 0.03421783447265625, 0.036956787109375, 0.03969573974609375, 0.0424346923828125, 0.04517364501953125, 0.04791259765625, 0.05065155029296875, 0.0533905029296875, 0.05612945556640625, 0.058868408203125, 0.06160736083984375, 0.0643463134765625, 0.06708526611328125, 0.06982421875, 0.07256317138671875, 0.0753021240234375, 0.07804107666015625, 0.080780029296875, 0.08351898193359375, 0.0862579345703125, 0.08899688720703125, 0.09173583984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 4.0, 1.0, 4.0, 9.0, 12.0, 12.0, 12.0, 9.0, 7.0, 14.0, 20.0, 22.0, 19.0, 34.0, 25.0, 29.0, 39.0, 38.0, 45.0, 30.0, 32.0, 40.0, 42.0, 30.0, 28.0, 50.0, 31.0, 21.0, 34.0, 37.0, 33.0, 37.0, 25.0, 21.0, 17.0, 30.0, 25.0, 18.0, 11.0, 16.0, 6.0, 7.0, 10.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06036376953125, -0.05838775634765625, -0.0564117431640625, -0.05443572998046875, -0.052459716796875, -0.05048370361328125, -0.0485076904296875, -0.04653167724609375, -0.0445556640625, -0.04257965087890625, -0.0406036376953125, -0.03862762451171875, -0.036651611328125, -0.03467559814453125, -0.0326995849609375, -0.03072357177734375, -0.02874755859375, -0.02677154541015625, -0.0247955322265625, -0.02281951904296875, -0.020843505859375, -0.01886749267578125, -0.0168914794921875, -0.01491546630859375, -0.012939453125, -0.01096343994140625, -0.0089874267578125, -0.00701141357421875, -0.005035400390625, -0.00305938720703125, -0.0010833740234375, 0.00089263916015625, 0.00286865234375, 0.00484466552734375, 0.0068206787109375, 0.00879669189453125, 0.010772705078125, 0.01274871826171875, 0.0147247314453125, 0.01670074462890625, 0.0186767578125, 0.02065277099609375, 0.0226287841796875, 0.02460479736328125, 0.026580810546875, 0.02855682373046875, 0.0305328369140625, 0.03250885009765625, 0.03448486328125, 0.03646087646484375, 0.0384368896484375, 0.04041290283203125, 0.042388916015625, 0.04436492919921875, 0.0463409423828125, 0.04831695556640625, 0.05029296875, 0.05226898193359375, 0.0542449951171875, 0.05622100830078125, 0.058197021484375, 0.06017303466796875, 0.0621490478515625, 0.06412506103515625, 0.06610107421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 16.0, 20.0, 24.0, 47.0, 80.0, 165.0, 247.0, 459.0, 745.0, 1442.0, 2759.0, 6160.0, 14946.0, 39069.0, 116844.0, 319712.0, 341777.0, 130905.0, 43782.0, 16198.0, 6605.0, 3110.0, 1497.0, 766.0, 486.0, 268.0, 156.0, 94.0, 58.0, 42.0, 34.0, 12.0, 10.0, 6.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016021728515625, -0.015551209449768066, -0.015080690383911133, -0.0146101713180542, -0.014139652252197266, -0.013669133186340332, -0.013198614120483398, -0.012728095054626465, -0.012257575988769531, -0.011787056922912598, -0.011316537857055664, -0.01084601879119873, -0.010375499725341797, -0.009904980659484863, -0.00943446159362793, -0.008963942527770996, -0.008493423461914062, -0.008022904396057129, -0.007552385330200195, -0.007081866264343262, -0.006611347198486328, -0.0061408281326293945, -0.005670309066772461, -0.005199790000915527, -0.004729270935058594, -0.00425875186920166, -0.0037882328033447266, -0.003317713737487793, -0.0028471946716308594, -0.0023766756057739258, -0.0019061565399169922, -0.0014356374740600586, -0.000965118408203125, -0.0004945993423461914, -2.4080276489257812e-05, 0.0004464387893676758, 0.0009169578552246094, 0.001387476921081543, 0.0018579959869384766, 0.00232851505279541, 0.0027990341186523438, 0.0032695531845092773, 0.003740072250366211, 0.0042105913162231445, 0.004681110382080078, 0.005151629447937012, 0.005622148513793945, 0.006092667579650879, 0.0065631866455078125, 0.007033705711364746, 0.00750422477722168, 0.007974743843078613, 0.008445262908935547, 0.00891578197479248, 0.009386301040649414, 0.009856820106506348, 0.010327339172363281, 0.010797858238220215, 0.011268377304077148, 0.011738896369934082, 0.012209415435791016, 0.01267993450164795, 0.013150453567504883, 0.013620972633361816, 0.01409149169921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 2.0, 18.0, 14.0, 23.0, 29.0, 50.0, 69.0, 93.0, 90.0, 81.0, 135.0, 123.0, 82.0, 53.0, 29.0, 47.0, 24.0, 14.0, 12.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.106231689453125e-06, -7.701106369495392e-06, -7.295981049537659e-06, -6.8908557295799255e-06, -6.485730409622192e-06, -6.080605089664459e-06, -5.675479769706726e-06, -5.270354449748993e-06, -4.86522912979126e-06, -4.460103809833527e-06, -4.0549784898757935e-06, -3.6498531699180603e-06, -3.244727849960327e-06, -2.839602530002594e-06, -2.434477210044861e-06, -2.0293518900871277e-06, -1.6242265701293945e-06, -1.2191012501716614e-06, -8.139759302139282e-07, -4.0885061025619507e-07, -3.725290298461914e-09, 4.0140002965927124e-07, 8.065253496170044e-07, 1.2116506695747375e-06, 1.6167759895324707e-06, 2.021901309490204e-06, 2.427026629447937e-06, 2.83215194940567e-06, 3.2372772693634033e-06, 3.6424025893211365e-06, 4.04752790927887e-06, 4.452653229236603e-06, 4.857778549194336e-06, 5.262903869152069e-06, 5.668029189109802e-06, 6.073154509067535e-06, 6.4782798290252686e-06, 6.883405148983002e-06, 7.288530468940735e-06, 7.693655788898468e-06, 8.098781108856201e-06, 8.503906428813934e-06, 8.909031748771667e-06, 9.3141570687294e-06, 9.719282388687134e-06, 1.0124407708644867e-05, 1.05295330286026e-05, 1.0934658348560333e-05, 1.1339783668518066e-05, 1.17449089884758e-05, 1.2150034308433533e-05, 1.2555159628391266e-05, 1.2960284948348999e-05, 1.3365410268306732e-05, 1.3770535588264465e-05, 1.4175660908222198e-05, 1.4580786228179932e-05, 1.4985911548137665e-05, 1.5391036868095398e-05, 1.579616218805313e-05, 1.6201287508010864e-05, 1.6606412827968597e-05, 1.701153814792633e-05, 1.7416663467884064e-05, 1.7821788787841797e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 8.0, 19.0, 16.0, 34.0, 36.0, 70.0, 131.0, 264.0, 707.0, 2609.0, 13987.0, 126211.0, 709160.0, 172909.0, 17802.0, 3086.0, 842.0, 316.0, 118.0, 74.0, 50.0, 28.0, 17.0, 14.0, 6.0, 10.0, 11.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034088134765625, -0.03297281265258789, -0.03185749053955078, -0.030742168426513672, -0.029626846313476562, -0.028511524200439453, -0.027396202087402344, -0.026280879974365234, -0.025165557861328125, -0.024050235748291016, -0.022934913635253906, -0.021819591522216797, -0.020704269409179688, -0.019588947296142578, -0.01847362518310547, -0.01735830307006836, -0.01624298095703125, -0.01512765884399414, -0.014012336730957031, -0.012897014617919922, -0.011781692504882812, -0.010666370391845703, -0.009551048278808594, -0.008435726165771484, -0.007320404052734375, -0.006205081939697266, -0.005089759826660156, -0.003974437713623047, -0.0028591156005859375, -0.0017437934875488281, -0.0006284713745117188, 0.0004868507385253906, 0.0016021728515625, 0.0027174949645996094, 0.0038328170776367188, 0.004948139190673828, 0.0060634613037109375, 0.007178783416748047, 0.008294105529785156, 0.009409427642822266, 0.010524749755859375, 0.011640071868896484, 0.012755393981933594, 0.013870716094970703, 0.014986038208007812, 0.016101360321044922, 0.01721668243408203, 0.01833200454711914, 0.01944732666015625, 0.02056264877319336, 0.02167797088623047, 0.022793292999267578, 0.023908615112304688, 0.025023937225341797, 0.026139259338378906, 0.027254581451416016, 0.028369903564453125, 0.029485225677490234, 0.030600547790527344, 0.03171586990356445, 0.03283119201660156, 0.03394651412963867, 0.03506183624267578, 0.03617715835571289, 0.03729248046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 5.0, 7.0, 14.0, 22.0, 29.0, 52.0, 97.0, 127.0, 163.0, 153.0, 126.0, 79.0, 47.0, 33.0, 23.0, 9.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142059326171875, -0.013358831405639648, -0.012511730194091797, -0.011664628982543945, -0.010817527770996094, -0.009970426559448242, -0.00912332534790039, -0.008276224136352539, -0.0074291229248046875, -0.006582021713256836, -0.005734920501708984, -0.004887819290161133, -0.004040718078613281, -0.0031936168670654297, -0.002346515655517578, -0.0014994144439697266, -0.000652313232421875, 0.00019478797912597656, 0.0010418891906738281, 0.0018889904022216797, 0.0027360916137695312, 0.003583192825317383, 0.004430294036865234, 0.005277395248413086, 0.0061244964599609375, 0.006971597671508789, 0.00781869888305664, 0.008665800094604492, 0.009512901306152344, 0.010360002517700195, 0.011207103729248047, 0.012054204940795898, 0.01290130615234375, 0.013748407363891602, 0.014595508575439453, 0.015442609786987305, 0.016289710998535156, 0.017136812210083008, 0.01798391342163086, 0.01883101463317871, 0.019678115844726562, 0.020525217056274414, 0.021372318267822266, 0.022219419479370117, 0.02306652069091797, 0.02391362190246582, 0.024760723114013672, 0.025607824325561523, 0.026454925537109375, 0.027302026748657227, 0.028149127960205078, 0.02899622917175293, 0.02984333038330078, 0.030690431594848633, 0.031537532806396484, 0.032384634017944336, 0.03323173522949219, 0.03407883644104004, 0.03492593765258789, 0.03577303886413574, 0.036620140075683594, 0.037467241287231445, 0.0383143424987793, 0.03916144371032715, 0.040008544921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 12.0, 16.0, 46.0, 104.0, 188.0, 254.0, 201.0, 106.0, 48.0, 20.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16989654302597046, -0.15891921520233154, -0.14794187247753143, -0.13696454465389252, -0.1259872019290924, -0.11500987410545349, -0.10403253883123398, -0.09305520355701447, -0.08207786828279495, -0.07110053300857544, -0.060123197734355927, -0.04914586618542671, -0.0381685309112072, -0.027191195636987686, -0.01621386408805847, -0.005236528813838959, 0.005740806460380554, 0.016718141734600067, 0.02769547514617443, 0.038672808557748795, 0.04965014383196831, 0.06062747910618782, 0.07160481065511703, 0.08258214592933655, 0.09355948120355606, 0.10453681647777557, 0.11551415175199509, 0.1264914870262146, 0.13746881484985352, 0.14844615757465363, 0.15942348539829254, 0.17040082812309265, 0.18137815594673157, 0.19235548377037048, 0.2033328264951706, 0.2143101543188095, 0.22528749704360962, 0.23626482486724854, 0.24724215269088745, 0.25821948051452637, 0.26919683814048767, 0.2801741659641266, 0.2911514937877655, 0.3021288514137268, 0.3131061792373657, 0.32408350706100464, 0.33506083488464355, 0.34603816270828247, 0.3570154905319214, 0.3679928183555603, 0.3789701461791992, 0.3899475038051605, 0.40092483162879944, 0.41190215945243835, 0.42287948727607727, 0.4338568449020386, 0.4448341727256775, 0.4558115005493164, 0.4667888283729553, 0.4777661859989166, 0.48874351382255554, 0.49972084164619446, 0.5106981992721558, 0.5216755270957947, 0.5326528549194336]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 10.0, 15.0, 12.0, 25.0, 17.0, 16.0, 21.0, 34.0, 37.0, 41.0, 32.0, 46.0, 33.0, 46.0, 48.0, 48.0, 52.0, 46.0, 38.0, 46.0, 43.0, 39.0, 44.0, 37.0, 29.0, 14.0, 30.0, 21.0, 7.0, 11.0, 6.0, 8.0, 3.0, 5.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.18048226833343506, -0.17455172538757324, -0.16862118244171143, -0.1626906394958496, -0.1567600965499878, -0.15082955360412598, -0.14489901065826416, -0.13896846771240234, -0.13303792476654053, -0.1271073818206787, -0.1211768388748169, -0.11524629592895508, -0.10931575298309326, -0.10338521003723145, -0.09745465964078903, -0.09152411669492722, -0.0855935662984848, -0.07966302335262299, -0.07373248040676117, -0.06780193746089935, -0.06187139078974724, -0.05594084784388542, -0.05001030117273331, -0.04407975822687149, -0.038149215281009674, -0.03221867233514786, -0.026288127526640892, -0.020357582718133926, -0.01442703977227211, -0.008496496826410294, -0.0025659501552581787, 0.0033645927906036377, 0.009295135736465454, 0.015225679613649845, 0.021156223490834236, 0.027086768299341202, 0.03301731124520302, 0.038947854191064835, 0.04487840086221695, 0.050808943808078766, 0.05673948675394058, 0.0626700296998024, 0.06860057264566422, 0.07453112304210663, 0.08046166598796844, 0.08639220893383026, 0.09232275187969208, 0.0982532948255539, 0.10418383777141571, 0.11011438071727753, 0.11604492366313934, 0.12197546660900116, 0.12790600955486298, 0.1338365525007248, 0.1397671103477478, 0.14569765329360962, 0.15162819623947144, 0.15755873918533325, 0.16348928213119507, 0.16941982507705688, 0.1753503680229187, 0.18128091096878052, 0.18721145391464233, 0.19314199686050415, 0.19907253980636597]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 10.0, 13.0, 39.0, 71.0, 115.0, 239.0, 571.0, 1744.0, 7637.0, 75680.0, 3629248.0, 458058.0, 16251.0, 3153.0, 819.0, 332.0, 153.0, 59.0, 41.0, 19.0, 13.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.12322998046875, -0.1194620132446289, -0.11569404602050781, -0.11192607879638672, -0.10815811157226562, -0.10439014434814453, -0.10062217712402344, -0.09685420989990234, -0.09308624267578125, -0.08931827545166016, -0.08555030822753906, -0.08178234100341797, -0.07801437377929688, -0.07424640655517578, -0.07047843933105469, -0.0667104721069336, -0.0629425048828125, -0.059174537658691406, -0.05540657043457031, -0.05163860321044922, -0.047870635986328125, -0.04410266876220703, -0.04033470153808594, -0.036566734313964844, -0.03279876708984375, -0.029030799865722656, -0.025262832641601562, -0.02149486541748047, -0.017726898193359375, -0.013958930969238281, -0.010190963745117188, -0.006422996520996094, -0.002655029296875, 0.0011129379272460938, 0.0048809051513671875, 0.008648872375488281, 0.012416839599609375, 0.01618480682373047, 0.019952774047851562, 0.023720741271972656, 0.02748870849609375, 0.031256675720214844, 0.03502464294433594, 0.03879261016845703, 0.042560577392578125, 0.04632854461669922, 0.05009651184082031, 0.053864479064941406, 0.0576324462890625, 0.061400413513183594, 0.06516838073730469, 0.06893634796142578, 0.07270431518554688, 0.07647228240966797, 0.08024024963378906, 0.08400821685791016, 0.08777618408203125, 0.09154415130615234, 0.09531211853027344, 0.09908008575439453, 0.10284805297851562, 0.10661602020263672, 0.11038398742675781, 0.1141519546508789, 0.117919921875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 10.0, 18.0, 39.0, 55.0, 59.0, 110.0, 112.0, 134.0, 111.0, 113.0, 76.0, 70.0, 40.0, 23.0, 16.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0958251953125, -0.09306144714355469, -0.09029769897460938, -0.08753395080566406, -0.08477020263671875, -0.08200645446777344, -0.07924270629882812, -0.07647895812988281, -0.0737152099609375, -0.07095146179199219, -0.06818771362304688, -0.06542396545410156, -0.06266021728515625, -0.05989646911621094, -0.057132720947265625, -0.05436897277832031, -0.051605224609375, -0.04884147644042969, -0.046077728271484375, -0.04331398010253906, -0.04055023193359375, -0.03778648376464844, -0.035022735595703125, -0.03225898742675781, -0.0294952392578125, -0.026731491088867188, -0.023967742919921875, -0.021203994750976562, -0.01844024658203125, -0.015676498413085938, -0.012912750244140625, -0.010149002075195312, -0.00738525390625, -0.0046215057373046875, -0.001857757568359375, 0.0009059906005859375, 0.00366973876953125, 0.0064334869384765625, 0.009197235107421875, 0.011960983276367188, 0.0147247314453125, 0.017488479614257812, 0.020252227783203125, 0.023015975952148438, 0.02577972412109375, 0.028543472290039062, 0.031307220458984375, 0.03407096862792969, 0.036834716796875, 0.03959846496582031, 0.042362213134765625, 0.04512596130371094, 0.04788970947265625, 0.05065345764160156, 0.053417205810546875, 0.05618095397949219, 0.0589447021484375, 0.06170845031738281, 0.06447219848632812, 0.06723594665527344, 0.06999969482421875, 0.07276344299316406, 0.07552719116210938, 0.07829093933105469, 0.0810546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 9.0, 9.0, 16.0, 26.0, 39.0, 69.0, 122.0, 210.0, 387.0, 805.0, 1585.0, 3594.0, 8435.0, 21887.0, 66748.0, 279377.0, 2138099.0, 1403838.0, 189511.0, 50095.0, 17042.0, 6593.0, 2939.0, 1330.0, 673.0, 356.0, 190.0, 125.0, 67.0, 34.0, 19.0, 17.0, 10.0, 12.0, 8.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033111572265625, -0.03187990188598633, -0.030648231506347656, -0.029416561126708984, -0.028184890747070312, -0.02695322036743164, -0.02572154998779297, -0.024489879608154297, -0.023258209228515625, -0.022026538848876953, -0.02079486846923828, -0.01956319808959961, -0.018331527709960938, -0.017099857330322266, -0.015868186950683594, -0.014636516571044922, -0.01340484619140625, -0.012173175811767578, -0.010941505432128906, -0.009709835052490234, -0.008478164672851562, -0.007246494293212891, -0.006014823913574219, -0.004783153533935547, -0.003551483154296875, -0.002319812774658203, -0.0010881423950195312, 0.00014352798461914062, 0.0013751983642578125, 0.0026068687438964844, 0.0038385391235351562, 0.005070209503173828, 0.0063018798828125, 0.007533550262451172, 0.008765220642089844, 0.009996891021728516, 0.011228561401367188, 0.01246023178100586, 0.013691902160644531, 0.014923572540283203, 0.016155242919921875, 0.017386913299560547, 0.01861858367919922, 0.01985025405883789, 0.021081924438476562, 0.022313594818115234, 0.023545265197753906, 0.024776935577392578, 0.02600860595703125, 0.027240276336669922, 0.028471946716308594, 0.029703617095947266, 0.030935287475585938, 0.03216695785522461, 0.03339862823486328, 0.03463029861450195, 0.035861968994140625, 0.0370936393737793, 0.03832530975341797, 0.03955698013305664, 0.04078865051269531, 0.042020320892333984, 0.043251991271972656, 0.04448366165161133, 0.04571533203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 8.0, 7.0, 21.0, 21.0, 30.0, 37.0, 58.0, 97.0, 162.0, 332.0, 599.0, 917.0, 763.0, 464.0, 242.0, 110.0, 70.0, 43.0, 28.0, 25.0, 14.0, 6.0, 1.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.065185546875, -0.06362342834472656, -0.062061309814453125, -0.06049919128417969, -0.05893707275390625, -0.05737495422363281, -0.055812835693359375, -0.05425071716308594, -0.0526885986328125, -0.05112648010253906, -0.049564361572265625, -0.04800224304199219, -0.04644012451171875, -0.04487800598144531, -0.043315887451171875, -0.04175376892089844, -0.040191650390625, -0.03862953186035156, -0.037067413330078125, -0.03550529479980469, -0.03394317626953125, -0.03238105773925781, -0.030818939208984375, -0.029256820678710938, -0.0276947021484375, -0.026132583618164062, -0.024570465087890625, -0.023008346557617188, -0.02144622802734375, -0.019884109497070312, -0.018321990966796875, -0.016759872436523438, -0.01519775390625, -0.013635635375976562, -0.012073516845703125, -0.010511398315429688, -0.00894927978515625, -0.0073871612548828125, -0.005825042724609375, -0.0042629241943359375, -0.0027008056640625, -0.0011386871337890625, 0.000423431396484375, 0.0019855499267578125, 0.00354766845703125, 0.0051097869873046875, 0.006671905517578125, 0.008234024047851562, 0.009796142578125, 0.011358261108398438, 0.012920379638671875, 0.014482498168945312, 0.01604461669921875, 0.017606735229492188, 0.019168853759765625, 0.020730972290039062, 0.0222930908203125, 0.023855209350585938, 0.025417327880859375, 0.026979446411132812, 0.02854156494140625, 0.030103683471679688, 0.031665802001953125, 0.03322792053222656, 0.0347900390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 19.0, 31.0, 49.0, 50.0, 119.0, 127.0, 139.0, 141.0, 119.0, 77.0, 50.0, 33.0, 19.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210373193025589, -0.20381109416484833, -0.19724899530410767, -0.1906868815422058, -0.18412478268146515, -0.1775626838207245, -0.17100058495998383, -0.16443848609924316, -0.1578763723373413, -0.15131427347660065, -0.14475217461585999, -0.13819006085395813, -0.13162796199321747, -0.1250658631324768, -0.11850376427173615, -0.11194166541099548, -0.10537956655025482, -0.09881746768951416, -0.0922553613781929, -0.08569326251745224, -0.07913115620613098, -0.07256905734539032, -0.06600695848464966, -0.0594448558986187, -0.05288275331258774, -0.04632065072655678, -0.03975854814052582, -0.033196449279785156, -0.026634346693754196, -0.020072244107723236, -0.013510145246982574, -0.006948042660951614, -0.00038592517375946045, 0.006176176480948925, 0.01273827813565731, 0.01930037885904312, 0.02586248144507408, 0.03242458403110504, 0.0389866828918457, 0.04554878547787666, 0.05211088806390762, 0.05867299064993858, 0.06523509323596954, 0.0717971920967102, 0.07835929095745087, 0.08492139726877213, 0.09148349612951279, 0.09804560244083405, 0.10460770130157471, 0.11116980016231537, 0.11773190647363663, 0.12429400533437729, 0.13085611164569855, 0.1374182105064392, 0.14398030936717987, 0.15054240822792053, 0.1571045219898224, 0.16366662085056305, 0.1702287197113037, 0.17679083347320557, 0.18335293233394623, 0.1899150311946869, 0.19647713005542755, 0.2030392289161682, 0.20960132777690887]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 14.0, 10.0, 11.0, 22.0, 12.0, 24.0, 26.0, 26.0, 27.0, 33.0, 37.0, 34.0, 44.0, 41.0, 41.0, 33.0, 39.0, 46.0, 39.0, 38.0, 44.0, 35.0, 41.0, 31.0, 31.0, 25.0, 28.0, 19.0, 14.0, 24.0, 22.0, 5.0, 15.0, 7.0, 12.0, 8.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.10558658838272095, -0.1027383953332901, -0.09989019483327866, -0.09704200178384781, -0.09419380128383636, -0.09134560823440552, -0.08849741518497467, -0.08564922213554382, -0.08280102163553238, -0.07995282858610153, -0.07710462808609009, -0.07425643503665924, -0.0714082419872284, -0.06856004148721695, -0.0657118484377861, -0.06286364793777466, -0.06001545488834381, -0.057167258113622665, -0.05431906133890152, -0.05147086828947067, -0.04862267151474953, -0.04577447474002838, -0.042926281690597534, -0.04007808491587639, -0.03722988814115524, -0.0343816913664341, -0.03153349459171295, -0.028685301542282104, -0.02583710476756096, -0.022988907992839813, -0.020140713080763817, -0.01729251816868782, -0.014444321393966675, -0.011596125550568104, -0.008747929707169533, -0.005899733863770962, -0.0030515380203723907, -0.00020334217697381973, 0.0026448536664247513, 0.005493048578500748, 0.008341245353221893, 0.011189441196620464, 0.014037637040019035, 0.016885831952095032, 0.019734028726816177, 0.022582225501537323, 0.02543042041361332, 0.028278615325689316, 0.03112681210041046, 0.03397500887513161, 0.03682320564985275, 0.0396713986992836, 0.042519595474004745, 0.04536779224872589, 0.04821598529815674, 0.051064182072877884, 0.05391237884759903, 0.056760575622320175, 0.05960877239704132, 0.06245696544647217, 0.06530515849590302, 0.06815335899591446, 0.0710015520453453, 0.07384975254535675, 0.0766979455947876]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 11.0, 10.0, 9.0, 12.0, 20.0, 18.0, 28.0, 49.0, 41.0, 81.0, 82.0, 138.0, 194.0, 253.0, 393.0, 608.0, 1230.0, 2674.0, 6836.0, 20380.0, 68141.0, 237961.0, 439391.0, 189392.0, 53577.0, 16400.0, 5539.0, 2174.0, 1074.0, 623.0, 364.0, 226.0, 175.0, 99.0, 78.0, 60.0, 45.0, 44.0, 33.0, 26.0, 22.0, 11.0, 6.0, 7.0, 5.0, 5.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06648635864257812, -0.06436920166015625, -0.062252044677734375, -0.0601348876953125, -0.058017730712890625, -0.05590057373046875, -0.053783416748046875, -0.051666259765625, -0.049549102783203125, -0.04743194580078125, -0.045314788818359375, -0.0431976318359375, -0.041080474853515625, -0.03896331787109375, -0.036846160888671875, -0.03472900390625, -0.032611846923828125, -0.03049468994140625, -0.028377532958984375, -0.0262603759765625, -0.024143218994140625, -0.02202606201171875, -0.019908905029296875, -0.017791748046875, -0.015674591064453125, -0.01355743408203125, -0.011440277099609375, -0.0093231201171875, -0.007205963134765625, -0.00508880615234375, -0.002971649169921875, -0.0008544921875, 0.001262664794921875, 0.00337982177734375, 0.005496978759765625, 0.0076141357421875, 0.009731292724609375, 0.01184844970703125, 0.013965606689453125, 0.016082763671875, 0.018199920654296875, 0.02031707763671875, 0.022434234619140625, 0.0245513916015625, 0.026668548583984375, 0.02878570556640625, 0.030902862548828125, 0.03302001953125, 0.035137176513671875, 0.03725433349609375, 0.039371490478515625, 0.0414886474609375, 0.043605804443359375, 0.04572296142578125, 0.047840118408203125, 0.049957275390625, 0.052074432373046875, 0.05419158935546875, 0.056308746337890625, 0.0584259033203125, 0.060543060302734375, 0.06266021728515625, 0.06477737426757812, 0.06689453125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 15.0, 23.0, 38.0, 52.0, 77.0, 144.0, 125.0, 135.0, 126.0, 94.0, 76.0, 43.0, 26.0, 13.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1051025390625, -0.10219192504882812, -0.09928131103515625, -0.09637069702148438, -0.0934600830078125, -0.09054946899414062, -0.08763885498046875, -0.08472824096679688, -0.081817626953125, -0.07890701293945312, -0.07599639892578125, -0.07308578491210938, -0.0701751708984375, -0.06726455688476562, -0.06435394287109375, -0.061443328857421875, -0.05853271484375, -0.055622100830078125, -0.05271148681640625, -0.049800872802734375, -0.0468902587890625, -0.043979644775390625, -0.04106903076171875, -0.038158416748046875, -0.035247802734375, -0.032337188720703125, -0.02942657470703125, -0.026515960693359375, -0.0236053466796875, -0.020694732666015625, -0.01778411865234375, -0.014873504638671875, -0.011962890625, -0.009052276611328125, -0.00614166259765625, -0.003231048583984375, -0.0003204345703125, 0.002590179443359375, 0.00550079345703125, 0.008411407470703125, 0.011322021484375, 0.014232635498046875, 0.01714324951171875, 0.020053863525390625, 0.0229644775390625, 0.025875091552734375, 0.02878570556640625, 0.031696319580078125, 0.03460693359375, 0.037517547607421875, 0.04042816162109375, 0.043338775634765625, 0.0462493896484375, 0.049160003662109375, 0.05207061767578125, 0.054981231689453125, 0.057891845703125, 0.060802459716796875, 0.06371307373046875, 0.06662368774414062, 0.0695343017578125, 0.07244491577148438, 0.07535552978515625, 0.07826614379882812, 0.0811767578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 9.0, 9.0, 16.0, 21.0, 32.0, 37.0, 67.0, 105.0, 170.0, 285.0, 608.0, 1234.0, 3533.0, 11435.0, 40618.0, 153582.0, 427789.0, 294560.0, 81828.0, 22134.0, 6532.0, 2145.0, 786.0, 395.0, 216.0, 136.0, 87.0, 53.0, 33.0, 24.0, 21.0, 10.0, 8.0, 11.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0526123046875, -0.050844669342041016, -0.04907703399658203, -0.04730939865112305, -0.04554176330566406, -0.04377412796020508, -0.042006492614746094, -0.04023885726928711, -0.038471221923828125, -0.03670358657836914, -0.034935951232910156, -0.03316831588745117, -0.03140068054199219, -0.029633045196533203, -0.02786540985107422, -0.026097774505615234, -0.02433013916015625, -0.022562503814697266, -0.02079486846923828, -0.019027233123779297, -0.017259597778320312, -0.015491962432861328, -0.013724327087402344, -0.01195669174194336, -0.010189056396484375, -0.00842142105102539, -0.006653785705566406, -0.004886150360107422, -0.0031185150146484375, -0.0013508796691894531, 0.00041675567626953125, 0.0021843910217285156, 0.0039520263671875, 0.005719661712646484, 0.007487297058105469, 0.009254932403564453, 0.011022567749023438, 0.012790203094482422, 0.014557838439941406, 0.01632547378540039, 0.018093109130859375, 0.01986074447631836, 0.021628379821777344, 0.023396015167236328, 0.025163650512695312, 0.026931285858154297, 0.02869892120361328, 0.030466556549072266, 0.03223419189453125, 0.034001827239990234, 0.03576946258544922, 0.0375370979309082, 0.03930473327636719, 0.04107236862182617, 0.042840003967285156, 0.04460763931274414, 0.046375274658203125, 0.04814291000366211, 0.049910545349121094, 0.05167818069458008, 0.05344581604003906, 0.05521345138549805, 0.05698108673095703, 0.058748722076416016, 0.060516357421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 8.0, 11.0, 8.0, 13.0, 17.0, 16.0, 22.0, 22.0, 30.0, 40.0, 29.0, 29.0, 39.0, 40.0, 45.0, 39.0, 43.0, 54.0, 35.0, 57.0, 48.0, 43.0, 34.0, 27.0, 28.0, 43.0, 26.0, 25.0, 19.0, 14.0, 20.0, 8.0, 15.0, 8.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08685302734375, -0.08446407318115234, -0.08207511901855469, -0.07968616485595703, -0.07729721069335938, -0.07490825653076172, -0.07251930236816406, -0.0701303482055664, -0.06774139404296875, -0.0653524398803711, -0.06296348571777344, -0.06057453155517578, -0.058185577392578125, -0.05579662322998047, -0.05340766906738281, -0.051018714904785156, -0.0486297607421875, -0.046240806579589844, -0.04385185241699219, -0.04146289825439453, -0.039073944091796875, -0.03668498992919922, -0.03429603576660156, -0.031907081604003906, -0.02951812744140625, -0.027129173278808594, -0.024740219116210938, -0.02235126495361328, -0.019962310791015625, -0.01757335662841797, -0.015184402465820312, -0.012795448303222656, -0.010406494140625, -0.008017539978027344, -0.0056285858154296875, -0.0032396316528320312, -0.000850677490234375, 0.0015382766723632812, 0.0039272308349609375, 0.006316184997558594, 0.00870513916015625, 0.011094093322753906, 0.013483047485351562, 0.01587200164794922, 0.018260955810546875, 0.02064990997314453, 0.023038864135742188, 0.025427818298339844, 0.0278167724609375, 0.030205726623535156, 0.03259468078613281, 0.03498363494873047, 0.037372589111328125, 0.03976154327392578, 0.04215049743652344, 0.044539451599121094, 0.04692840576171875, 0.049317359924316406, 0.05170631408691406, 0.05409526824951172, 0.056484222412109375, 0.05887317657470703, 0.06126213073730469, 0.06365108489990234, 0.0660400390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 16.0, 15.0, 23.0, 25.0, 31.0, 52.0, 71.0, 89.0, 135.0, 199.0, 257.0, 344.0, 547.0, 825.0, 1180.0, 1922.0, 3275.0, 6374.0, 14905.0, 42559.0, 149879.0, 407259.0, 287573.0, 83551.0, 25501.0, 9828.0, 4760.0, 2564.0, 1579.0, 982.0, 644.0, 416.0, 344.0, 213.0, 171.0, 112.0, 90.0, 62.0, 44.0, 30.0, 32.0, 18.0, 10.0, 11.0, 6.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.0198974609375, -0.01932525634765625, -0.0187530517578125, -0.01818084716796875, -0.017608642578125, -0.01703643798828125, -0.0164642333984375, -0.01589202880859375, -0.01531982421875, -0.01474761962890625, -0.0141754150390625, -0.01360321044921875, -0.013031005859375, -0.01245880126953125, -0.0118865966796875, -0.01131439208984375, -0.0107421875, -0.01016998291015625, -0.0095977783203125, -0.00902557373046875, -0.008453369140625, -0.00788116455078125, -0.0073089599609375, -0.00673675537109375, -0.00616455078125, -0.00559234619140625, -0.0050201416015625, -0.00444793701171875, -0.003875732421875, -0.00330352783203125, -0.0027313232421875, -0.00215911865234375, -0.0015869140625, -0.00101470947265625, -0.0004425048828125, 0.00012969970703125, 0.000701904296875, 0.00127410888671875, 0.0018463134765625, 0.00241851806640625, 0.00299072265625, 0.00356292724609375, 0.0041351318359375, 0.00470733642578125, 0.005279541015625, 0.00585174560546875, 0.0064239501953125, 0.00699615478515625, 0.007568359375, 0.00814056396484375, 0.0087127685546875, 0.00928497314453125, 0.009857177734375, 0.01042938232421875, 0.0110015869140625, 0.01157379150390625, 0.01214599609375, 0.01271820068359375, 0.0132904052734375, 0.01386260986328125, 0.014434814453125, 0.01500701904296875, 0.0155792236328125, 0.01615142822265625, 0.0167236328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 12.0, 21.0, 10.0, 21.0, 23.0, 28.0, 44.0, 36.0, 50.0, 47.0, 64.0, 75.0, 71.0, 44.0, 53.0, 65.0, 38.0, 57.0, 38.0, 26.0, 56.0, 15.0, 13.0, 16.0, 15.0, 9.0, 3.0, 3.0, 10.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.463859558105469e-06, -8.21240246295929e-06, -7.96094536781311e-06, -7.709488272666931e-06, -7.458031177520752e-06, -7.206574082374573e-06, -6.9551169872283936e-06, -6.703659892082214e-06, -6.452202796936035e-06, -6.200745701789856e-06, -5.949288606643677e-06, -5.6978315114974976e-06, -5.446374416351318e-06, -5.194917321205139e-06, -4.94346022605896e-06, -4.692003130912781e-06, -4.4405460357666016e-06, -4.189088940620422e-06, -3.937631845474243e-06, -3.686174750328064e-06, -3.4347176551818848e-06, -3.1832605600357056e-06, -2.9318034648895264e-06, -2.680346369743347e-06, -2.428889274597168e-06, -2.1774321794509888e-06, -1.9259750843048096e-06, -1.6745179891586304e-06, -1.4230608940124512e-06, -1.171603798866272e-06, -9.201467037200928e-07, -6.686896085739136e-07, -4.172325134277344e-07, -1.6577541828155518e-07, 8.568167686462402e-08, 3.371387720108032e-07, 5.885958671569824e-07, 8.400529623031616e-07, 1.0915100574493408e-06, 1.34296715259552e-06, 1.5944242477416992e-06, 1.8458813428878784e-06, 2.0973384380340576e-06, 2.348795533180237e-06, 2.600252628326416e-06, 2.8517097234725952e-06, 3.1031668186187744e-06, 3.3546239137649536e-06, 3.606081008911133e-06, 3.857538104057312e-06, 4.108995199203491e-06, 4.36045229434967e-06, 4.61190938949585e-06, 4.863366484642029e-06, 5.114823579788208e-06, 5.366280674934387e-06, 5.617737770080566e-06, 5.869194865226746e-06, 6.120651960372925e-06, 6.372109055519104e-06, 6.623566150665283e-06, 6.875023245811462e-06, 7.126480340957642e-06, 7.377937436103821e-06, 7.62939453125e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 11.0, 10.0, 15.0, 12.0, 14.0, 27.0, 48.0, 52.0, 98.0, 151.0, 240.0, 394.0, 575.0, 1037.0, 1971.0, 4339.0, 12062.0, 51806.0, 325383.0, 519783.0, 99323.0, 19342.0, 6046.0, 2529.0, 1297.0, 775.0, 403.0, 287.0, 160.0, 112.0, 76.0, 55.0, 38.0, 25.0, 20.0, 15.0, 8.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0299530029296875, -0.028992414474487305, -0.02803182601928711, -0.027071237564086914, -0.02611064910888672, -0.025150060653686523, -0.024189472198486328, -0.023228883743286133, -0.022268295288085938, -0.021307706832885742, -0.020347118377685547, -0.01938652992248535, -0.018425941467285156, -0.01746535301208496, -0.016504764556884766, -0.01554417610168457, -0.014583587646484375, -0.01362299919128418, -0.012662410736083984, -0.011701822280883789, -0.010741233825683594, -0.009780645370483398, -0.008820056915283203, -0.007859468460083008, -0.0068988800048828125, -0.005938291549682617, -0.004977703094482422, -0.0040171146392822266, -0.0030565261840820312, -0.002095937728881836, -0.0011353492736816406, -0.0001747608184814453, 0.00078582763671875, 0.0017464160919189453, 0.0027070045471191406, 0.003667593002319336, 0.004628181457519531, 0.0055887699127197266, 0.006549358367919922, 0.007509946823120117, 0.008470535278320312, 0.009431123733520508, 0.010391712188720703, 0.011352300643920898, 0.012312889099121094, 0.013273477554321289, 0.014234066009521484, 0.01519465446472168, 0.016155242919921875, 0.01711583137512207, 0.018076419830322266, 0.01903700828552246, 0.019997596740722656, 0.02095818519592285, 0.021918773651123047, 0.022879362106323242, 0.023839950561523438, 0.024800539016723633, 0.025761127471923828, 0.026721715927124023, 0.02768230438232422, 0.028642892837524414, 0.02960348129272461, 0.030564069747924805, 0.031524658203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 11.0, 7.0, 16.0, 31.0, 40.0, 56.0, 87.0, 101.0, 119.0, 114.0, 99.0, 71.0, 68.0, 55.0, 30.0, 28.0, 9.0, 12.0, 9.0, 7.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02423095703125, -0.023371219635009766, -0.02251148223876953, -0.021651744842529297, -0.020792007446289062, -0.019932270050048828, -0.019072532653808594, -0.01821279525756836, -0.017353057861328125, -0.01649332046508789, -0.015633583068847656, -0.014773845672607422, -0.013914108276367188, -0.013054370880126953, -0.012194633483886719, -0.011334896087646484, -0.01047515869140625, -0.009615421295166016, -0.008755683898925781, -0.007895946502685547, -0.0070362091064453125, -0.006176471710205078, -0.005316734313964844, -0.004456996917724609, -0.003597259521484375, -0.0027375221252441406, -0.0018777847290039062, -0.0010180473327636719, -0.0001583099365234375, 0.0007014274597167969, 0.0015611648559570312, 0.0024209022521972656, 0.0032806396484375, 0.004140377044677734, 0.005000114440917969, 0.005859851837158203, 0.0067195892333984375, 0.007579326629638672, 0.008439064025878906, 0.00929880142211914, 0.010158538818359375, 0.01101827621459961, 0.011878013610839844, 0.012737751007080078, 0.013597488403320312, 0.014457225799560547, 0.015316963195800781, 0.016176700592041016, 0.01703643798828125, 0.017896175384521484, 0.01875591278076172, 0.019615650177001953, 0.020475387573242188, 0.021335124969482422, 0.022194862365722656, 0.02305459976196289, 0.023914337158203125, 0.02477407455444336, 0.025633811950683594, 0.026493549346923828, 0.027353286743164062, 0.028213024139404297, 0.02907276153564453, 0.029932498931884766, 0.030792236328125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 33.0, 531.0, 402.0, 40.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22229546308517456, -0.17703565955162048, -0.1317758411169052, -0.08651602268218994, -0.041256219148635864, 0.004003584384918213, 0.04926341772079468, 0.09452322125434875, 0.13978302478790283, 0.1850428283214569, 0.23030264675617218, 0.27556246519088745, 0.32082226872444153, 0.3660820722579956, 0.41134190559387207, 0.45660170912742615, 0.5018615126609802, 0.5471213459968567, 0.5923811197280884, 0.6376409530639648, 0.6829007863998413, 0.728160560131073, 0.7734203934669495, 0.8186801671981812, 0.8639400005340576, 0.9091998338699341, 0.9544596076011658, 0.9997194409370422, 1.044979214668274, 1.0902390480041504, 1.1354988813400269, 1.1807587146759033, 1.2260184288024902, 1.2712782621383667, 1.3165380954742432, 1.36179780960083, 1.4070576429367065, 1.452317476272583, 1.4975773096084595, 1.542837142944336, 1.5880968570709229, 1.6333566904067993, 1.6786165237426758, 1.7238762378692627, 1.7691360712051392, 1.8143959045410156, 1.859655737876892, 1.9049155712127686, 1.950175404548645, 1.9954352378845215, 2.0406949520111084, 2.0859549045562744, 2.1312146186828613, 2.1764745712280273, 2.2217342853546143, 2.266993999481201, 2.312253952026367, 2.357513666152954, 2.40277361869812, 2.448033332824707, 2.493293285369873, 2.53855299949646, 2.583812713623047, 2.629072666168213, 2.6743323802948]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 11.0, 16.0, 12.0, 16.0, 24.0, 17.0, 30.0, 24.0, 33.0, 32.0, 28.0, 46.0, 46.0, 39.0, 36.0, 36.0, 43.0, 44.0, 53.0, 43.0, 27.0, 58.0, 35.0, 34.0, 23.0, 33.0, 23.0, 18.0, 17.0, 12.0, 18.0, 12.0, 18.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.20782434940338135, -0.2012813687324524, -0.19473838806152344, -0.1881953924894333, -0.18165241181850433, -0.17510943114757538, -0.16856643557548523, -0.16202345490455627, -0.15548047423362732, -0.14893749356269836, -0.1423945128917694, -0.13585151731967926, -0.1293085366487503, -0.12276555597782135, -0.1162225678563118, -0.10967957973480225, -0.10313659906387329, -0.09659361839294434, -0.09005063027143478, -0.08350764214992523, -0.07696466147899628, -0.07042168080806732, -0.06387869268655777, -0.057335708290338516, -0.05079272389411926, -0.04424973949790001, -0.037706755101680756, -0.031163770705461502, -0.02462078630924225, -0.018077801913022995, -0.011534817516803741, -0.004991833120584488, 0.0015511512756347656, 0.00809413567185402, 0.014637120068073273, 0.021180104464292526, 0.02772308886051178, 0.03426607325673103, 0.04080905765295029, 0.04735204204916954, 0.053895026445388794, 0.06043801084160805, 0.0669809952378273, 0.07352398335933685, 0.08006696403026581, 0.08660994470119476, 0.09315293282270432, 0.09969592094421387, 0.10623890161514282, 0.11278188228607178, 0.11932487040758133, 0.12586785852909088, 0.13241083920001984, 0.1389538198709488, 0.14549681544303894, 0.1520397961139679, 0.15858277678489685, 0.1651257574558258, 0.17166873812675476, 0.1782117336988449, 0.18475471436977386, 0.19129769504070282, 0.19784069061279297, 0.20438367128372192, 0.21092665195465088]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 15.0, 20.0, 32.0, 44.0, 74.0, 133.0, 225.0, 432.0, 1048.0, 2806.0, 9931.0, 61728.0, 1665469.0, 2346663.0, 88857.0, 11611.0, 3207.0, 1144.0, 399.0, 196.0, 104.0, 50.0, 29.0, 21.0, 10.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10980224609375, -0.10706138610839844, -0.10432052612304688, -0.10157966613769531, -0.09883880615234375, -0.09609794616699219, -0.09335708618164062, -0.09061622619628906, -0.0878753662109375, -0.08513450622558594, -0.08239364624023438, -0.07965278625488281, -0.07691192626953125, -0.07417106628417969, -0.07143020629882812, -0.06868934631347656, -0.065948486328125, -0.06320762634277344, -0.060466766357421875, -0.05772590637207031, -0.05498504638671875, -0.05224418640136719, -0.049503326416015625, -0.04676246643066406, -0.0440216064453125, -0.04128074645996094, -0.038539886474609375, -0.03579902648925781, -0.03305816650390625, -0.030317306518554688, -0.027576446533203125, -0.024835586547851562, -0.0220947265625, -0.019353866577148438, -0.016613006591796875, -0.013872146606445312, -0.01113128662109375, -0.008390426635742188, -0.005649566650390625, -0.0029087066650390625, -0.0001678466796875, 0.0025730133056640625, 0.005313873291015625, 0.008054733276367188, 0.01079559326171875, 0.013536453247070312, 0.016277313232421875, 0.019018173217773438, 0.021759033203125, 0.024499893188476562, 0.027240753173828125, 0.029981613159179688, 0.03272247314453125, 0.03546333312988281, 0.038204193115234375, 0.04094505310058594, 0.0436859130859375, 0.04642677307128906, 0.049167633056640625, 0.05190849304199219, 0.05464935302734375, 0.05739021301269531, 0.060131072998046875, 0.06287193298339844, 0.06561279296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 16.0, 26.0, 36.0, 51.0, 65.0, 113.0, 116.0, 148.0, 129.0, 107.0, 73.0, 44.0, 32.0, 21.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0941162109375, -0.09137535095214844, -0.08863449096679688, -0.08589363098144531, -0.08315277099609375, -0.08041191101074219, -0.07767105102539062, -0.07493019104003906, -0.0721893310546875, -0.06944847106933594, -0.06670761108398438, -0.06396675109863281, -0.06122589111328125, -0.05848503112792969, -0.055744171142578125, -0.05300331115722656, -0.050262451171875, -0.04752159118652344, -0.044780731201171875, -0.04203987121582031, -0.03929901123046875, -0.03655815124511719, -0.033817291259765625, -0.031076431274414062, -0.0283355712890625, -0.025594711303710938, -0.022853851318359375, -0.020112991333007812, -0.01737213134765625, -0.014631271362304688, -0.011890411376953125, -0.009149551391601562, -0.00640869140625, -0.0036678314208984375, -0.000926971435546875, 0.0018138885498046875, 0.00455474853515625, 0.0072956085205078125, 0.010036468505859375, 0.012777328491210938, 0.0155181884765625, 0.018259048461914062, 0.020999908447265625, 0.023740768432617188, 0.02648162841796875, 0.029222488403320312, 0.031963348388671875, 0.03470420837402344, 0.037445068359375, 0.04018592834472656, 0.042926788330078125, 0.04566764831542969, 0.04840850830078125, 0.05114936828613281, 0.053890228271484375, 0.05663108825683594, 0.0593719482421875, 0.06211280822753906, 0.06485366821289062, 0.06759452819824219, 0.07033538818359375, 0.07307624816894531, 0.07581710815429688, 0.07855796813964844, 0.081298828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 6.0, 4.0, 8.0, 7.0, 12.0, 16.0, 21.0, 21.0, 30.0, 42.0, 52.0, 84.0, 166.0, 294.0, 590.0, 1303.0, 3418.0, 9741.0, 32727.0, 142444.0, 1116036.0, 2494462.0, 308095.0, 59483.0, 16116.0, 5309.0, 1950.0, 829.0, 409.0, 219.0, 111.0, 64.0, 42.0, 25.0, 27.0, 22.0, 10.0, 21.0, 6.0, 5.0, 13.0, 7.0, 5.0, 4.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04425048828125, -0.04268217086791992, -0.041113853454589844, -0.039545536041259766, -0.03797721862792969, -0.03640890121459961, -0.03484058380126953, -0.03327226638793945, -0.031703948974609375, -0.030135631561279297, -0.02856731414794922, -0.02699899673461914, -0.025430679321289062, -0.023862361907958984, -0.022294044494628906, -0.020725727081298828, -0.01915740966796875, -0.017589092254638672, -0.016020774841308594, -0.014452457427978516, -0.012884140014648438, -0.01131582260131836, -0.009747505187988281, -0.008179187774658203, -0.006610870361328125, -0.005042552947998047, -0.0034742355346679688, -0.0019059181213378906, -0.0003376007080078125, 0.0012307167053222656, 0.0027990341186523438, 0.004367351531982422, 0.0059356689453125, 0.007503986358642578, 0.009072303771972656, 0.010640621185302734, 0.012208938598632812, 0.01377725601196289, 0.015345573425292969, 0.016913890838623047, 0.018482208251953125, 0.020050525665283203, 0.02161884307861328, 0.02318716049194336, 0.024755477905273438, 0.026323795318603516, 0.027892112731933594, 0.029460430145263672, 0.03102874755859375, 0.03259706497192383, 0.034165382385253906, 0.035733699798583984, 0.03730201721191406, 0.03887033462524414, 0.04043865203857422, 0.0420069694519043, 0.043575286865234375, 0.04514360427856445, 0.04671192169189453, 0.04828023910522461, 0.04984855651855469, 0.051416873931884766, 0.052985191345214844, 0.05455350875854492, 0.056121826171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 19.0, 19.0, 39.0, 61.0, 95.0, 165.0, 247.0, 503.0, 754.0, 789.0, 565.0, 342.0, 170.0, 95.0, 57.0, 37.0, 26.0, 27.0, 14.0, 12.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048309326171875, -0.04670381546020508, -0.045098304748535156, -0.043492794036865234, -0.04188728332519531, -0.04028177261352539, -0.03867626190185547, -0.03707075119018555, -0.035465240478515625, -0.0338597297668457, -0.03225421905517578, -0.03064870834350586, -0.029043197631835938, -0.027437686920166016, -0.025832176208496094, -0.024226665496826172, -0.02262115478515625, -0.021015644073486328, -0.019410133361816406, -0.017804622650146484, -0.016199111938476562, -0.01459360122680664, -0.012988090515136719, -0.011382579803466797, -0.009777069091796875, -0.008171558380126953, -0.006566047668457031, -0.004960536956787109, -0.0033550262451171875, -0.0017495155334472656, -0.00014400482177734375, 0.0014615058898925781, 0.0030670166015625, 0.004672527313232422, 0.006278038024902344, 0.007883548736572266, 0.009489059448242188, 0.01109457015991211, 0.012700080871582031, 0.014305591583251953, 0.015911102294921875, 0.017516613006591797, 0.01912212371826172, 0.02072763442993164, 0.022333145141601562, 0.023938655853271484, 0.025544166564941406, 0.027149677276611328, 0.02875518798828125, 0.030360698699951172, 0.031966209411621094, 0.033571720123291016, 0.03517723083496094, 0.03678274154663086, 0.03838825225830078, 0.0399937629699707, 0.041599273681640625, 0.04320478439331055, 0.04481029510498047, 0.04641580581665039, 0.04802131652832031, 0.049626827239990234, 0.051232337951660156, 0.05283784866333008, 0.054443359375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 12.0, 21.0, 50.0, 81.0, 132.0, 168.0, 207.0, 127.0, 98.0, 40.0, 39.0, 12.0, 7.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12716475129127502, -0.11738310754299164, -0.10760146379470825, -0.09781982004642487, -0.08803817629814148, -0.0782565325498581, -0.06847488880157471, -0.05869324505329132, -0.048911601305007935, -0.03912995755672455, -0.029348313808441162, -0.019566670060157776, -0.00978502631187439, -3.382563591003418e-06, 0.009778261184692383, 0.01955990493297577, 0.029341548681259155, 0.03912319242954254, 0.04890483617782593, 0.058686479926109314, 0.0684681236743927, 0.07824976742267609, 0.08803141117095947, 0.09781305491924286, 0.10759469866752625, 0.11737634241580963, 0.12715798616409302, 0.1369396299123764, 0.1467212736606598, 0.15650291740894318, 0.16628456115722656, 0.17606620490550995, 0.18584787845611572, 0.1956295222043991, 0.2054111659526825, 0.21519280970096588, 0.22497445344924927, 0.23475609719753265, 0.24453774094581604, 0.25431936979293823, 0.2641010284423828, 0.2738826870918274, 0.2836643159389496, 0.2934459447860718, 0.30322760343551636, 0.31300926208496094, 0.32279089093208313, 0.3325725197792053, 0.3423541784286499, 0.3521358370780945, 0.3619174659252167, 0.37169909477233887, 0.38148075342178345, 0.391262412071228, 0.4010440409183502, 0.4108256697654724, 0.420607328414917, 0.4303889870643616, 0.44017061591148376, 0.44995224475860596, 0.45973390340805054, 0.4695155620574951, 0.4792971909046173, 0.4890788197517395, 0.4988604784011841]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 6.0, 13.0, 20.0, 13.0, 27.0, 31.0, 30.0, 27.0, 28.0, 36.0, 42.0, 36.0, 39.0, 47.0, 54.0, 34.0, 47.0, 37.0, 38.0, 45.0, 43.0, 40.0, 40.0, 37.0, 27.0, 23.0, 23.0, 25.0, 18.0, 14.0, 8.0, 8.0, 7.0, 7.0, 4.0, 8.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.13960421085357666, -0.13575610518455505, -0.13190799951553345, -0.12805989384651184, -0.12421178072690964, -0.12036367505788803, -0.11651556193828583, -0.11266745626926422, -0.10881935060024261, -0.10497124493122101, -0.1011231392621994, -0.0972750261425972, -0.09342692047357559, -0.08957881480455399, -0.08573070168495178, -0.08188259601593018, -0.07803449034690857, -0.07418638467788696, -0.07033827900886536, -0.06649016588926315, -0.06264206022024155, -0.05879395455121994, -0.054945845156908035, -0.05109773576259613, -0.047249630093574524, -0.04340152442455292, -0.03955341503024101, -0.03570530563592911, -0.0318571999669075, -0.028009092435240746, -0.02416098490357399, -0.020312877371907234, -0.01646476984024048, -0.012616662308573723, -0.008768554776906967, -0.0049204472452402115, -0.0010723397135734558, 0.0027757678180933, 0.0066238753497600555, 0.010471982881426811, 0.014320090413093567, 0.018168197944760323, 0.022016305476427078, 0.025864413008093834, 0.02971252053976059, 0.033560626208782196, 0.0374087356030941, 0.041256844997406006, 0.04510495066642761, 0.04895305633544922, 0.052801165729761124, 0.05664927512407303, 0.060497380793094635, 0.06434548646211624, 0.06819359958171844, 0.07204170525074005, 0.07588981091976166, 0.07973791658878326, 0.08358602225780487, 0.08743413537740707, 0.09128224104642868, 0.09513034671545029, 0.09897845983505249, 0.1028265655040741, 0.1066746711730957]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 10.0, 12.0, 12.0, 26.0, 26.0, 51.0, 72.0, 110.0, 206.0, 326.0, 662.0, 1210.0, 3247.0, 11116.0, 53974.0, 277804.0, 520376.0, 141765.0, 27151.0, 6196.0, 2098.0, 893.0, 491.0, 269.0, 143.0, 80.0, 77.0, 56.0, 37.0, 21.0, 7.0, 8.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0927734375, -0.09006786346435547, -0.08736228942871094, -0.0846567153930664, -0.08195114135742188, -0.07924556732177734, -0.07653999328613281, -0.07383441925048828, -0.07112884521484375, -0.06842327117919922, -0.06571769714355469, -0.06301212310791016, -0.060306549072265625, -0.057600975036621094, -0.05489540100097656, -0.05218982696533203, -0.0494842529296875, -0.04677867889404297, -0.04407310485839844, -0.041367530822753906, -0.038661956787109375, -0.035956382751464844, -0.03325080871582031, -0.03054523468017578, -0.02783966064453125, -0.02513408660888672, -0.022428512573242188, -0.019722938537597656, -0.017017364501953125, -0.014311790466308594, -0.011606216430664062, -0.008900642395019531, -0.006195068359375, -0.0034894943237304688, -0.0007839202880859375, 0.0019216537475585938, 0.004627227783203125, 0.007332801818847656, 0.010038375854492188, 0.012743949890136719, 0.01544952392578125, 0.01815509796142578, 0.020860671997070312, 0.023566246032714844, 0.026271820068359375, 0.028977394104003906, 0.03168296813964844, 0.03438854217529297, 0.0370941162109375, 0.03979969024658203, 0.04250526428222656, 0.045210838317871094, 0.047916412353515625, 0.050621986389160156, 0.05332756042480469, 0.05603313446044922, 0.05873870849609375, 0.06144428253173828, 0.06414985656738281, 0.06685543060302734, 0.06956100463867188, 0.0722665786743164, 0.07497215270996094, 0.07767772674560547, 0.08038330078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 4.0, 26.0, 19.0, 39.0, 69.0, 93.0, 113.0, 132.0, 131.0, 124.0, 91.0, 63.0, 41.0, 23.0, 17.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09454345703125, -0.09183883666992188, -0.08913421630859375, -0.08642959594726562, -0.0837249755859375, -0.08102035522460938, -0.07831573486328125, -0.07561111450195312, -0.072906494140625, -0.07020187377929688, -0.06749725341796875, -0.06479263305664062, -0.0620880126953125, -0.059383392333984375, -0.05667877197265625, -0.053974151611328125, -0.05126953125, -0.048564910888671875, -0.04586029052734375, -0.043155670166015625, -0.0404510498046875, -0.037746429443359375, -0.03504180908203125, -0.032337188720703125, -0.029632568359375, -0.026927947998046875, -0.02422332763671875, -0.021518707275390625, -0.0188140869140625, -0.016109466552734375, -0.01340484619140625, -0.010700225830078125, -0.00799560546875, -0.005290985107421875, -0.00258636474609375, 0.000118255615234375, 0.0028228759765625, 0.005527496337890625, 0.00823211669921875, 0.010936737060546875, 0.013641357421875, 0.016345977783203125, 0.01905059814453125, 0.021755218505859375, 0.0244598388671875, 0.027164459228515625, 0.02986907958984375, 0.032573699951171875, 0.0352783203125, 0.037982940673828125, 0.04068756103515625, 0.043392181396484375, 0.0460968017578125, 0.048801422119140625, 0.05150604248046875, 0.054210662841796875, 0.056915283203125, 0.059619903564453125, 0.06232452392578125, 0.06502914428710938, 0.0677337646484375, 0.07043838500976562, 0.07314300537109375, 0.07584762573242188, 0.07855224609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 8.0, 13.0, 14.0, 18.0, 28.0, 29.0, 33.0, 68.0, 75.0, 99.0, 161.0, 285.0, 517.0, 927.0, 2046.0, 4418.0, 9672.0, 22618.0, 53806.0, 129792.0, 278613.0, 295489.0, 144130.0, 60407.0, 25107.0, 10760.0, 4802.0, 2111.0, 1052.0, 512.0, 331.0, 153.0, 121.0, 82.0, 49.0, 48.0, 39.0, 19.0, 17.0, 14.0, 11.0, 8.0, 7.0, 3.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.03570556640625, -0.034517765045166016, -0.03332996368408203, -0.03214216232299805, -0.030954360961914062, -0.029766559600830078, -0.028578758239746094, -0.02739095687866211, -0.026203155517578125, -0.02501535415649414, -0.023827552795410156, -0.022639751434326172, -0.021451950073242188, -0.020264148712158203, -0.01907634735107422, -0.017888545989990234, -0.01670074462890625, -0.015512943267822266, -0.014325141906738281, -0.013137340545654297, -0.011949539184570312, -0.010761737823486328, -0.009573936462402344, -0.00838613510131836, -0.007198333740234375, -0.006010532379150391, -0.004822731018066406, -0.003634929656982422, -0.0024471282958984375, -0.0012593269348144531, -7.152557373046875e-05, 0.0011162757873535156, 0.0023040771484375, 0.0034918785095214844, 0.004679679870605469, 0.005867481231689453, 0.0070552825927734375, 0.008243083953857422, 0.009430885314941406, 0.01061868667602539, 0.011806488037109375, 0.01299428939819336, 0.014182090759277344, 0.015369892120361328, 0.016557693481445312, 0.017745494842529297, 0.01893329620361328, 0.020121097564697266, 0.02130889892578125, 0.022496700286865234, 0.02368450164794922, 0.024872303009033203, 0.026060104370117188, 0.027247905731201172, 0.028435707092285156, 0.02962350845336914, 0.030811309814453125, 0.03199911117553711, 0.033186912536621094, 0.03437471389770508, 0.03556251525878906, 0.03675031661987305, 0.03793811798095703, 0.039125919342041016, 0.040313720703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 9.0, 4.0, 5.0, 6.0, 6.0, 6.0, 13.0, 19.0, 13.0, 15.0, 16.0, 19.0, 17.0, 29.0, 17.0, 25.0, 37.0, 31.0, 35.0, 38.0, 35.0, 30.0, 50.0, 32.0, 34.0, 37.0, 30.0, 43.0, 37.0, 25.0, 30.0, 32.0, 27.0, 25.0, 32.0, 8.0, 23.0, 19.0, 12.0, 12.0, 14.0, 8.0, 11.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0556640625, -0.053888797760009766, -0.05211353302001953, -0.0503382682800293, -0.04856300354003906, -0.04678773880004883, -0.045012474060058594, -0.04323720932006836, -0.041461944580078125, -0.03968667984008789, -0.037911415100097656, -0.03613615036010742, -0.03436088562011719, -0.03258562088012695, -0.03081035614013672, -0.029035091400146484, -0.02725982666015625, -0.025484561920166016, -0.02370929718017578, -0.021934032440185547, -0.020158767700195312, -0.018383502960205078, -0.016608238220214844, -0.01483297348022461, -0.013057708740234375, -0.01128244400024414, -0.009507179260253906, -0.007731914520263672, -0.0059566497802734375, -0.004181385040283203, -0.0024061203002929688, -0.0006308555603027344, 0.0011444091796875, 0.0029196739196777344, 0.004694938659667969, 0.006470203399658203, 0.008245468139648438, 0.010020732879638672, 0.011795997619628906, 0.01357126235961914, 0.015346527099609375, 0.01712179183959961, 0.018897056579589844, 0.020672321319580078, 0.022447586059570312, 0.024222850799560547, 0.02599811553955078, 0.027773380279541016, 0.02954864501953125, 0.031323909759521484, 0.03309917449951172, 0.03487443923950195, 0.03664970397949219, 0.03842496871948242, 0.040200233459472656, 0.04197549819946289, 0.043750762939453125, 0.04552602767944336, 0.047301292419433594, 0.04907655715942383, 0.05085182189941406, 0.0526270866394043, 0.05440235137939453, 0.056177616119384766, 0.057952880859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 7.0, 9.0, 7.0, 10.0, 14.0, 23.0, 30.0, 60.0, 74.0, 122.0, 147.0, 263.0, 359.0, 639.0, 906.0, 1534.0, 2624.0, 4543.0, 8238.0, 16782.0, 36384.0, 85892.0, 212921.0, 348512.0, 187170.0, 75675.0, 32710.0, 14842.0, 7443.0, 4274.0, 2299.0, 1447.0, 901.0, 553.0, 386.0, 249.0, 156.0, 113.0, 55.0, 51.0, 35.0, 27.0, 20.0, 13.0, 14.0, 4.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 6.0, 0.0, 1.0], "bins": [-0.0135040283203125, -0.013087630271911621, -0.012671232223510742, -0.012254834175109863, -0.011838436126708984, -0.011422038078308105, -0.011005640029907227, -0.010589241981506348, -0.010172843933105469, -0.00975644588470459, -0.009340047836303711, -0.008923649787902832, -0.008507251739501953, -0.008090853691101074, -0.007674455642700195, -0.007258057594299316, -0.0068416595458984375, -0.006425261497497559, -0.00600886344909668, -0.005592465400695801, -0.005176067352294922, -0.004759669303894043, -0.004343271255493164, -0.003926873207092285, -0.0035104751586914062, -0.0030940771102905273, -0.0026776790618896484, -0.0022612810134887695, -0.0018448829650878906, -0.0014284849166870117, -0.0010120868682861328, -0.0005956888198852539, -0.000179290771484375, 0.0002371072769165039, 0.0006535053253173828, 0.0010699033737182617, 0.0014863014221191406, 0.0019026994705200195, 0.0023190975189208984, 0.0027354955673217773, 0.0031518936157226562, 0.003568291664123535, 0.003984689712524414, 0.004401087760925293, 0.004817485809326172, 0.005233883857727051, 0.00565028190612793, 0.006066679954528809, 0.0064830780029296875, 0.006899476051330566, 0.007315874099731445, 0.007732272148132324, 0.008148670196533203, 0.008565068244934082, 0.008981466293334961, 0.00939786434173584, 0.009814262390136719, 0.010230660438537598, 0.010647058486938477, 0.011063456535339355, 0.011479854583740234, 0.011896252632141113, 0.012312650680541992, 0.012729048728942871, 0.01314544677734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 9.0, 2.0, 7.0, 4.0, 15.0, 15.0, 18.0, 19.0, 21.0, 30.0, 23.0, 36.0, 26.0, 43.0, 72.0, 37.0, 51.0, 59.0, 40.0, 55.0, 50.0, 40.0, 42.0, 35.0, 39.0, 34.0, 27.0, 25.0, 30.0, 17.0, 19.0, 19.0, 6.0, 9.0, 2.0, 6.0, 2.0, 9.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.854534149169922e-06, -6.654299795627594e-06, -6.454065442085266e-06, -6.253831088542938e-06, -6.05359673500061e-06, -5.8533623814582825e-06, -5.653128027915955e-06, -5.452893674373627e-06, -5.252659320831299e-06, -5.052424967288971e-06, -4.852190613746643e-06, -4.651956260204315e-06, -4.451721906661987e-06, -4.2514875531196594e-06, -4.0512531995773315e-06, -3.851018846035004e-06, -3.6507844924926758e-06, -3.450550138950348e-06, -3.25031578540802e-06, -3.050081431865692e-06, -2.8498470783233643e-06, -2.6496127247810364e-06, -2.4493783712387085e-06, -2.2491440176963806e-06, -2.0489096641540527e-06, -1.8486753106117249e-06, -1.648440957069397e-06, -1.448206603527069e-06, -1.2479722499847412e-06, -1.0477378964424133e-06, -8.475035429000854e-07, -6.472691893577576e-07, -4.470348358154297e-07, -2.468004822731018e-07, -4.6566128730773926e-08, 1.5366822481155396e-07, 3.5390257835388184e-07, 5.541369318962097e-07, 7.543712854385376e-07, 9.546056389808655e-07, 1.1548399925231934e-06, 1.3550743460655212e-06, 1.5553086996078491e-06, 1.755543053150177e-06, 1.955777406692505e-06, 2.1560117602348328e-06, 2.3562461137771606e-06, 2.5564804673194885e-06, 2.7567148208618164e-06, 2.9569491744041443e-06, 3.157183527946472e-06, 3.3574178814888e-06, 3.557652235031128e-06, 3.757886588573456e-06, 3.958120942115784e-06, 4.1583552956581116e-06, 4.3585896492004395e-06, 4.558824002742767e-06, 4.759058356285095e-06, 4.959292709827423e-06, 5.159527063369751e-06, 5.359761416912079e-06, 5.559995770454407e-06, 5.760230123996735e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 3.0, 12.0, 14.0, 30.0, 59.0, 72.0, 147.0, 244.0, 519.0, 955.0, 2191.0, 5756.0, 18261.0, 82148.0, 486444.0, 368943.0, 59779.0, 14467.0, 4684.0, 1923.0, 926.0, 425.0, 220.0, 132.0, 81.0, 44.0, 23.0, 14.0, 9.0, 9.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0338134765625, -0.03284478187561035, -0.0318760871887207, -0.030907392501831055, -0.029938697814941406, -0.028970003128051758, -0.02800130844116211, -0.02703261375427246, -0.026063919067382812, -0.025095224380493164, -0.024126529693603516, -0.023157835006713867, -0.02218914031982422, -0.02122044563293457, -0.020251750946044922, -0.019283056259155273, -0.018314361572265625, -0.017345666885375977, -0.016376972198486328, -0.01540827751159668, -0.014439582824707031, -0.013470888137817383, -0.012502193450927734, -0.011533498764038086, -0.010564804077148438, -0.009596109390258789, -0.00862741470336914, -0.007658720016479492, -0.006690025329589844, -0.005721330642700195, -0.004752635955810547, -0.0037839412689208984, -0.00281524658203125, -0.0018465518951416016, -0.0008778572082519531, 9.083747863769531e-05, 0.0010595321655273438, 0.002028226852416992, 0.0029969215393066406, 0.003965616226196289, 0.0049343109130859375, 0.005903005599975586, 0.006871700286865234, 0.007840394973754883, 0.008809089660644531, 0.00977778434753418, 0.010746479034423828, 0.011715173721313477, 0.012683868408203125, 0.013652563095092773, 0.014621257781982422, 0.01558995246887207, 0.01655864715576172, 0.017527341842651367, 0.018496036529541016, 0.019464731216430664, 0.020433425903320312, 0.02140212059020996, 0.02237081527709961, 0.023339509963989258, 0.024308204650878906, 0.025276899337768555, 0.026245594024658203, 0.02721428871154785, 0.0281829833984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 4.0, 18.0, 8.0, 18.0, 26.0, 25.0, 43.0, 50.0, 69.0, 97.0, 133.0, 149.0, 109.0, 85.0, 54.0, 30.0, 26.0, 14.0, 7.0, 11.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0238800048828125, -0.023084640502929688, -0.022289276123046875, -0.021493911743164062, -0.02069854736328125, -0.019903182983398438, -0.019107818603515625, -0.018312454223632812, -0.01751708984375, -0.016721725463867188, -0.015926361083984375, -0.015130996704101562, -0.01433563232421875, -0.013540267944335938, -0.012744903564453125, -0.011949539184570312, -0.0111541748046875, -0.010358810424804688, -0.009563446044921875, -0.008768081665039062, -0.00797271728515625, -0.0071773529052734375, -0.006381988525390625, -0.0055866241455078125, -0.004791259765625, -0.0039958953857421875, -0.003200531005859375, -0.0024051666259765625, -0.00160980224609375, -0.0008144378662109375, -1.9073486328125e-05, 0.0007762908935546875, 0.0015716552734375, 0.0023670196533203125, 0.003162384033203125, 0.0039577484130859375, 0.00475311279296875, 0.0055484771728515625, 0.006343841552734375, 0.0071392059326171875, 0.0079345703125, 0.008729934692382812, 0.009525299072265625, 0.010320663452148438, 0.01111602783203125, 0.011911392211914062, 0.012706756591796875, 0.013502120971679688, 0.0142974853515625, 0.015092849731445312, 0.015888214111328125, 0.016683578491210938, 0.01747894287109375, 0.018274307250976562, 0.019069671630859375, 0.019865036010742188, 0.020660400390625, 0.021455764770507812, 0.022251129150390625, 0.023046493530273438, 0.02384185791015625, 0.024637222290039062, 0.025432586669921875, 0.026227951049804688, 0.0270233154296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 12.0, 165.0, 577.0, 205.0, 38.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.649794578552246, -1.6189637184143066, -1.5881328582763672, -1.5573018789291382, -1.5264710187911987, -1.4956401586532593, -1.4648092985153198, -1.4339783191680908, -1.4031474590301514, -1.372316598892212, -1.3414857387542725, -1.3106547594070435, -1.279823899269104, -1.2489930391311646, -1.218162178993225, -1.187331199645996, -1.1565003395080566, -1.1256694793701172, -1.0948386192321777, -1.0640076398849487, -1.0331767797470093, -1.0023459196090698, -0.9715149998664856, -0.9406841397285461, -0.9098532795906067, -0.8790224194526672, -0.848191499710083, -0.8173606395721436, -0.7865297198295593, -0.7556988596916199, -0.7248679399490356, -0.6940370798110962, -0.663206160068512, -0.6323752999305725, -0.6015443801879883, -0.5707135200500488, -0.5398826003074646, -0.5090517401695251, -0.4782208204269409, -0.44738996028900146, -0.41655904054641724, -0.3857281506061554, -0.35489726066589355, -0.3240663707256317, -0.2932354807853699, -0.2624046206474304, -0.23157371580600739, -0.20074282586574554, -0.1699119508266449, -0.13908106088638306, -0.10825017094612122, -0.07741928845643997, -0.04658839851617813, -0.015757516026496887, 0.015073373913764954, 0.045904263854026794, 0.07673515379428864, 0.10756604373455048, 0.13839693367481232, 0.16922780871391296, 0.2000586986541748, 0.23088958859443665, 0.2617204785346985, 0.2925513684749603, 0.32338225841522217]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 7.0, 9.0, 13.0, 7.0, 14.0, 19.0, 19.0, 20.0, 20.0, 31.0, 17.0, 24.0, 25.0, 44.0, 47.0, 42.0, 32.0, 44.0, 42.0, 40.0, 46.0, 33.0, 42.0, 38.0, 42.0, 32.0, 34.0, 25.0, 23.0, 25.0, 29.0, 14.0, 16.0, 11.0, 11.0, 10.0, 9.0, 6.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14031648635864258, -0.1355638951063156, -0.13081130385398865, -0.12605871260166168, -0.12130612879991531, -0.11655353754758835, -0.11180095374584198, -0.10704836249351501, -0.10229577124118805, -0.09754317998886108, -0.09279058873653412, -0.08803800493478775, -0.08328541368246078, -0.07853282243013382, -0.07378023862838745, -0.06902764737606049, -0.06427505612373352, -0.059522464871406555, -0.05476987734436989, -0.05001728981733322, -0.045264698565006256, -0.04051210731267929, -0.035759519785642624, -0.031006932258605957, -0.02625434100627899, -0.021501751616597176, -0.01674916222691536, -0.011996572837233543, -0.007243983447551727, -0.002491394057869911, 0.002261195331811905, 0.007013782858848572, 0.011766374111175537, 0.016518963500857353, 0.02127155289053917, 0.026024142280220985, 0.0307767316699028, 0.03552932292222977, 0.040281910449266434, 0.0450344979763031, 0.049787089228630066, 0.05453968048095703, 0.0592922680079937, 0.06404485553503036, 0.06879744678735733, 0.0735500380396843, 0.07830262184143066, 0.08305521309375763, 0.0878078043460846, 0.09256039559841156, 0.09731298685073853, 0.1020655706524849, 0.10681816190481186, 0.11157075315713882, 0.11632333695888519, 0.12107592821121216, 0.12582851946353912, 0.1305811107158661, 0.13533370196819305, 0.14008629322052002, 0.1448388695716858, 0.14959146082401276, 0.15434405207633972, 0.1590966433286667, 0.16384923458099365]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 11.0, 13.0, 21.0, 35.0, 64.0, 128.0, 293.0, 890.0, 4281.0, 49371.0, 3723156.0, 402732.0, 10952.0, 1661.0, 393.0, 147.0, 66.0, 35.0, 14.0, 12.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1915283203125, -0.18693828582763672, -0.18234825134277344, -0.17775821685791016, -0.17316818237304688, -0.1685781478881836, -0.1639881134033203, -0.15939807891845703, -0.15480804443359375, -0.15021800994873047, -0.1456279754638672, -0.1410379409790039, -0.13644790649414062, -0.13185787200927734, -0.12726783752441406, -0.12267780303955078, -0.1180877685546875, -0.11349773406982422, -0.10890769958496094, -0.10431766510009766, -0.09972763061523438, -0.0951375961303711, -0.09054756164550781, -0.08595752716064453, -0.08136749267578125, -0.07677745819091797, -0.07218742370605469, -0.0675973892211914, -0.06300735473632812, -0.058417320251464844, -0.05382728576660156, -0.04923725128173828, -0.044647216796875, -0.04005718231201172, -0.03546714782714844, -0.030877113342285156, -0.026287078857421875, -0.021697044372558594, -0.017107009887695312, -0.012516975402832031, -0.00792694091796875, -0.0033369064331054688, 0.0012531280517578125, 0.005843162536621094, 0.010433197021484375, 0.015023231506347656, 0.019613265991210938, 0.02420330047607422, 0.0287933349609375, 0.03338336944580078, 0.03797340393066406, 0.042563438415527344, 0.047153472900390625, 0.051743507385253906, 0.05633354187011719, 0.06092357635498047, 0.06551361083984375, 0.07010364532470703, 0.07469367980957031, 0.0792837142944336, 0.08387374877929688, 0.08846378326416016, 0.09305381774902344, 0.09764385223388672, 0.10223388671875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 14.0, 8.0, 16.0, 47.0, 46.0, 88.0, 97.0, 140.0, 141.0, 127.0, 105.0, 71.0, 49.0, 29.0, 15.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0946044921875, -0.09192085266113281, -0.08923721313476562, -0.08655357360839844, -0.08386993408203125, -0.08118629455566406, -0.07850265502929688, -0.07581901550292969, -0.0731353759765625, -0.07045173645019531, -0.06776809692382812, -0.06508445739746094, -0.06240081787109375, -0.05971717834472656, -0.057033538818359375, -0.05434989929199219, -0.051666259765625, -0.04898262023925781, -0.046298980712890625, -0.04361534118652344, -0.04093170166015625, -0.03824806213378906, -0.035564422607421875, -0.03288078308105469, -0.0301971435546875, -0.027513504028320312, -0.024829864501953125, -0.022146224975585938, -0.01946258544921875, -0.016778945922851562, -0.014095306396484375, -0.011411666870117188, -0.00872802734375, -0.0060443878173828125, -0.003360748291015625, -0.0006771087646484375, 0.00200653076171875, 0.0046901702880859375, 0.007373809814453125, 0.010057449340820312, 0.0127410888671875, 0.015424728393554688, 0.018108367919921875, 0.020792007446289062, 0.02347564697265625, 0.026159286499023438, 0.028842926025390625, 0.03152656555175781, 0.034210205078125, 0.03689384460449219, 0.039577484130859375, 0.04226112365722656, 0.04494476318359375, 0.04762840270996094, 0.050312042236328125, 0.05299568176269531, 0.0556793212890625, 0.05836296081542969, 0.061046600341796875, 0.06373023986816406, 0.06641387939453125, 0.06909751892089844, 0.07178115844726562, 0.07446479797363281, 0.0771484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 8.0, 8.0, 20.0, 25.0, 27.0, 35.0, 56.0, 105.0, 122.0, 209.0, 362.0, 560.0, 998.0, 1708.0, 3367.0, 6843.0, 15079.0, 35697.0, 94423.0, 316004.0, 1686934.0, 1580772.0, 297856.0, 90677.0, 34404.0, 14158.0, 6662.0, 3040.0, 1652.0, 968.0, 526.0, 343.0, 210.0, 147.0, 93.0, 67.0, 40.0, 21.0, 17.0, 13.0, 10.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.040924072265625, -0.03981733322143555, -0.038710594177246094, -0.03760385513305664, -0.03649711608886719, -0.035390377044677734, -0.03428363800048828, -0.03317689895629883, -0.032070159912109375, -0.030963420867919922, -0.02985668182373047, -0.028749942779541016, -0.027643203735351562, -0.02653646469116211, -0.025429725646972656, -0.024322986602783203, -0.02321624755859375, -0.022109508514404297, -0.021002769470214844, -0.01989603042602539, -0.018789291381835938, -0.017682552337646484, -0.01657581329345703, -0.015469074249267578, -0.014362335205078125, -0.013255596160888672, -0.012148857116699219, -0.011042118072509766, -0.009935379028320312, -0.00882863998413086, -0.007721900939941406, -0.006615161895751953, -0.0055084228515625, -0.004401683807373047, -0.0032949447631835938, -0.0021882057189941406, -0.0010814666748046875, 2.5272369384765625e-05, 0.0011320114135742188, 0.002238750457763672, 0.003345489501953125, 0.004452228546142578, 0.005558967590332031, 0.006665706634521484, 0.0077724456787109375, 0.00887918472290039, 0.009985923767089844, 0.011092662811279297, 0.01219940185546875, 0.013306140899658203, 0.014412879943847656, 0.01551961898803711, 0.016626358032226562, 0.017733097076416016, 0.01883983612060547, 0.019946575164794922, 0.021053314208984375, 0.022160053253173828, 0.02326679229736328, 0.024373531341552734, 0.025480270385742188, 0.02658700942993164, 0.027693748474121094, 0.028800487518310547, 0.0299072265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 11.0, 11.0, 25.0, 20.0, 35.0, 59.0, 84.0, 116.0, 193.0, 339.0, 607.0, 819.0, 725.0, 389.0, 218.0, 125.0, 76.0, 65.0, 55.0, 28.0, 16.0, 11.0, 14.0, 10.0, 1.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045074462890625, -0.0435490608215332, -0.042023658752441406, -0.04049825668334961, -0.03897285461425781, -0.037447452545166016, -0.03592205047607422, -0.03439664840698242, -0.032871246337890625, -0.03134584426879883, -0.02982044219970703, -0.028295040130615234, -0.026769638061523438, -0.02524423599243164, -0.023718833923339844, -0.022193431854248047, -0.02066802978515625, -0.019142627716064453, -0.017617225646972656, -0.01609182357788086, -0.014566421508789062, -0.013041019439697266, -0.011515617370605469, -0.009990215301513672, -0.008464813232421875, -0.006939411163330078, -0.005414009094238281, -0.0038886070251464844, -0.0023632049560546875, -0.0008378028869628906, 0.0006875991821289062, 0.002213001251220703, 0.0037384033203125, 0.005263805389404297, 0.006789207458496094, 0.00831460952758789, 0.009840011596679688, 0.011365413665771484, 0.012890815734863281, 0.014416217803955078, 0.015941619873046875, 0.017467021942138672, 0.01899242401123047, 0.020517826080322266, 0.022043228149414062, 0.02356863021850586, 0.025094032287597656, 0.026619434356689453, 0.02814483642578125, 0.029670238494873047, 0.031195640563964844, 0.03272104263305664, 0.03424644470214844, 0.035771846771240234, 0.03729724884033203, 0.03882265090942383, 0.040348052978515625, 0.04187345504760742, 0.04339885711669922, 0.044924259185791016, 0.04644966125488281, 0.04797506332397461, 0.049500465393066406, 0.0510258674621582, 0.05255126953125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 18.0, 28.0, 49.0, 112.0, 116.0, 179.0, 193.0, 124.0, 85.0, 47.0, 26.0, 10.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4807577133178711, -0.47068750858306885, -0.4606173038482666, -0.45054709911346436, -0.4404768943786621, -0.43040668964385986, -0.4203364849090576, -0.41026628017425537, -0.4001960754394531, -0.3901258707046509, -0.38005566596984863, -0.3699854612350464, -0.35991525650024414, -0.3498450517654419, -0.33977484703063965, -0.3297046422958374, -0.31963446736335754, -0.3095642626285553, -0.29949405789375305, -0.2894238531589508, -0.27935364842414856, -0.2692834436893463, -0.25921323895454407, -0.24914304912090302, -0.23907284438610077, -0.22900263965129852, -0.21893243491649628, -0.20886223018169403, -0.19879204034805298, -0.18872183561325073, -0.1786516308784485, -0.16858142614364624, -0.15851125121116638, -0.14844104647636414, -0.1383708417415619, -0.12830063700675964, -0.118230439722538, -0.10816023498773575, -0.0980900377035141, -0.08801983296871185, -0.0779496282339096, -0.06787942349910736, -0.05780922248959541, -0.047739021480083466, -0.03766881674528122, -0.027598612010478973, -0.017528411000967026, -0.007458209991455078, 0.002611994743347168, 0.012682197615504265, 0.02275240048766136, 0.03282260149717331, 0.042892806231975555, 0.0529630109667778, 0.06303320825099945, 0.0731034129858017, 0.08317361772060394, 0.09324382245540619, 0.10331402719020844, 0.11338422447443008, 0.12345442920923233, 0.13352462649345398, 0.14359483122825623, 0.15366503596305847, 0.16373524069786072]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 7.0, 4.0, 8.0, 12.0, 20.0, 14.0, 13.0, 22.0, 20.0, 21.0, 26.0, 35.0, 36.0, 25.0, 35.0, 37.0, 40.0, 42.0, 47.0, 37.0, 39.0, 46.0, 29.0, 43.0, 37.0, 37.0, 21.0, 19.0, 20.0, 25.0, 35.0, 20.0, 14.0, 12.0, 12.0, 12.0, 16.0, 11.0, 3.0, 8.0, 4.0, 3.0, 8.0, 6.0, 4.0, 1.0, 3.0, 7.0, 0.0, 0.0, 1.0], "bins": [-0.10535866022109985, -0.10217900574207306, -0.09899934381246567, -0.09581968188285828, -0.09264002740383148, -0.08946037292480469, -0.0862807109951973, -0.0831010490655899, -0.07992139458656311, -0.07674174010753632, -0.07356207817792892, -0.07038241624832153, -0.06720276176929474, -0.06402310729026794, -0.06084344536066055, -0.05766378715634346, -0.05448412895202637, -0.051304470747709274, -0.04812481254339218, -0.04494515433907509, -0.041765496134757996, -0.0385858379304409, -0.03540617972612381, -0.03222652152180672, -0.029046863317489624, -0.02586720511317253, -0.022687546908855438, -0.019507888704538345, -0.016328230500221252, -0.01314857229590416, -0.009968914091587067, -0.006789255887269974, -0.003609597682952881, -0.00042993947863578796, 0.002749718725681305, 0.005929376929998398, 0.00910903513431549, 0.012288693338632584, 0.015468351542949677, 0.01864800974726677, 0.021827667951583862, 0.025007326155900955, 0.028186984360218048, 0.03136664256453514, 0.034546300768852234, 0.03772595897316933, 0.04090561717748642, 0.04408527538180351, 0.047264933586120605, 0.0504445917904377, 0.05362424999475479, 0.056803908199071884, 0.05998356640338898, 0.06316322088241577, 0.06634288281202316, 0.06952254474163055, 0.07270219922065735, 0.07588185369968414, 0.07906151562929153, 0.08224117755889893, 0.08542083203792572, 0.08860048651695251, 0.0917801484465599, 0.0949598103761673, 0.09813946485519409]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 7.0, 5.0, 12.0, 10.0, 18.0, 25.0, 38.0, 50.0, 61.0, 85.0, 124.0, 194.0, 363.0, 640.0, 1365.0, 3456.0, 11067.0, 45645.0, 223218.0, 539473.0, 171999.0, 35838.0, 9221.0, 2957.0, 1167.0, 559.0, 317.0, 202.0, 139.0, 82.0, 75.0, 41.0, 24.0, 21.0, 15.0, 8.0, 8.0, 9.0, 5.0, 5.0, 0.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.09039306640625, -0.08784103393554688, -0.08528900146484375, -0.08273696899414062, -0.0801849365234375, -0.07763290405273438, -0.07508087158203125, -0.07252883911132812, -0.069976806640625, -0.06742477416992188, -0.06487274169921875, -0.062320709228515625, -0.0597686767578125, -0.057216644287109375, -0.05466461181640625, -0.052112579345703125, -0.049560546875, -0.047008514404296875, -0.04445648193359375, -0.041904449462890625, -0.0393524169921875, -0.036800384521484375, -0.03424835205078125, -0.031696319580078125, -0.029144287109375, -0.026592254638671875, -0.02404022216796875, -0.021488189697265625, -0.0189361572265625, -0.016384124755859375, -0.01383209228515625, -0.011280059814453125, -0.00872802734375, -0.006175994873046875, -0.00362396240234375, -0.001071929931640625, 0.0014801025390625, 0.004032135009765625, 0.00658416748046875, 0.009136199951171875, 0.011688232421875, 0.014240264892578125, 0.01679229736328125, 0.019344329833984375, 0.0218963623046875, 0.024448394775390625, 0.02700042724609375, 0.029552459716796875, 0.0321044921875, 0.034656524658203125, 0.03720855712890625, 0.039760589599609375, 0.0423126220703125, 0.044864654541015625, 0.04741668701171875, 0.049968719482421875, 0.052520751953125, 0.055072784423828125, 0.05762481689453125, 0.060176849365234375, 0.0627288818359375, 0.06528091430664062, 0.06783294677734375, 0.07038497924804688, 0.07293701171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 9.0, 9.0, 28.0, 50.0, 73.0, 97.0, 116.0, 137.0, 133.0, 109.0, 97.0, 69.0, 33.0, 21.0, 9.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09429931640625, -0.09159183502197266, -0.08888435363769531, -0.08617687225341797, -0.08346939086914062, -0.08076190948486328, -0.07805442810058594, -0.0753469467163086, -0.07263946533203125, -0.0699319839477539, -0.06722450256347656, -0.06451702117919922, -0.061809539794921875, -0.05910205841064453, -0.05639457702636719, -0.053687095642089844, -0.0509796142578125, -0.048272132873535156, -0.04556465148925781, -0.04285717010498047, -0.040149688720703125, -0.03744220733642578, -0.03473472595214844, -0.032027244567871094, -0.02931976318359375, -0.026612281799316406, -0.023904800415039062, -0.02119731903076172, -0.018489837646484375, -0.01578235626220703, -0.013074874877929688, -0.010367393493652344, -0.007659912109375, -0.004952430725097656, -0.0022449493408203125, 0.00046253204345703125, 0.003170013427734375, 0.005877494812011719, 0.008584976196289062, 0.011292457580566406, 0.01399993896484375, 0.016707420349121094, 0.019414901733398438, 0.02212238311767578, 0.024829864501953125, 0.02753734588623047, 0.030244827270507812, 0.032952308654785156, 0.0356597900390625, 0.038367271423339844, 0.04107475280761719, 0.04378223419189453, 0.046489715576171875, 0.04919719696044922, 0.05190467834472656, 0.054612159729003906, 0.05731964111328125, 0.060027122497558594, 0.06273460388183594, 0.06544208526611328, 0.06814956665039062, 0.07085704803466797, 0.07356452941894531, 0.07627201080322266, 0.0789794921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 10.0, 16.0, 8.0, 20.0, 27.0, 42.0, 38.0, 98.0, 153.0, 226.0, 400.0, 830.0, 1558.0, 3228.0, 6654.0, 14178.0, 31474.0, 72291.0, 166977.0, 300309.0, 244754.0, 114725.0, 49367.0, 21707.0, 9879.0, 4673.0, 2286.0, 1114.0, 625.0, 354.0, 193.0, 103.0, 67.0, 44.0, 34.0, 29.0, 14.0, 11.0, 10.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03570556640625, -0.034581661224365234, -0.03345775604248047, -0.0323338508605957, -0.031209945678710938, -0.030086040496826172, -0.028962135314941406, -0.02783823013305664, -0.026714324951171875, -0.02559041976928711, -0.024466514587402344, -0.023342609405517578, -0.022218704223632812, -0.021094799041748047, -0.01997089385986328, -0.018846988677978516, -0.01772308349609375, -0.016599178314208984, -0.015475273132324219, -0.014351367950439453, -0.013227462768554688, -0.012103557586669922, -0.010979652404785156, -0.00985574722290039, -0.008731842041015625, -0.007607936859130859, -0.006484031677246094, -0.005360126495361328, -0.0042362213134765625, -0.003112316131591797, -0.0019884109497070312, -0.0008645057678222656, 0.0002593994140625, 0.0013833045959472656, 0.0025072097778320312, 0.003631114959716797, 0.0047550201416015625, 0.005878925323486328, 0.007002830505371094, 0.00812673568725586, 0.009250640869140625, 0.01037454605102539, 0.011498451232910156, 0.012622356414794922, 0.013746261596679688, 0.014870166778564453, 0.01599407196044922, 0.017117977142333984, 0.01824188232421875, 0.019365787506103516, 0.02048969268798828, 0.021613597869873047, 0.022737503051757812, 0.023861408233642578, 0.024985313415527344, 0.02610921859741211, 0.027233123779296875, 0.02835702896118164, 0.029480934143066406, 0.030604839324951172, 0.03172874450683594, 0.0328526496887207, 0.03397655487060547, 0.035100460052490234, 0.036224365234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 8.0, 9.0, 8.0, 4.0, 9.0, 15.0, 17.0, 28.0, 25.0, 19.0, 37.0, 35.0, 32.0, 49.0, 51.0, 57.0, 59.0, 56.0, 56.0, 52.0, 53.0, 37.0, 31.0, 29.0, 32.0, 38.0, 33.0, 21.0, 16.0, 22.0, 15.0, 11.0, 7.0, 8.0, 7.0, 4.0, 3.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.095703125, -0.09309959411621094, -0.09049606323242188, -0.08789253234863281, -0.08528900146484375, -0.08268547058105469, -0.08008193969726562, -0.07747840881347656, -0.0748748779296875, -0.07227134704589844, -0.06966781616210938, -0.06706428527832031, -0.06446075439453125, -0.06185722351074219, -0.059253692626953125, -0.05665016174316406, -0.054046630859375, -0.05144309997558594, -0.048839569091796875, -0.04623603820800781, -0.04363250732421875, -0.04102897644042969, -0.038425445556640625, -0.03582191467285156, -0.0332183837890625, -0.030614852905273438, -0.028011322021484375, -0.025407791137695312, -0.02280426025390625, -0.020200729370117188, -0.017597198486328125, -0.014993667602539062, -0.01239013671875, -0.009786605834960938, -0.007183074951171875, -0.0045795440673828125, -0.00197601318359375, 0.0006275177001953125, 0.003231048583984375, 0.0058345794677734375, 0.0084381103515625, 0.011041641235351562, 0.013645172119140625, 0.016248703002929688, 0.01885223388671875, 0.021455764770507812, 0.024059295654296875, 0.026662826538085938, 0.029266357421875, 0.03186988830566406, 0.034473419189453125, 0.03707695007324219, 0.03968048095703125, 0.04228401184082031, 0.044887542724609375, 0.04749107360839844, 0.0500946044921875, 0.05269813537597656, 0.055301666259765625, 0.05790519714355469, 0.06050872802734375, 0.06311225891113281, 0.06571578979492188, 0.06831932067871094, 0.0709228515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 14.0, 19.0, 30.0, 36.0, 54.0, 76.0, 109.0, 160.0, 269.0, 421.0, 628.0, 1059.0, 1733.0, 3150.0, 6334.0, 14763.0, 38593.0, 125577.0, 366264.0, 326676.0, 104342.0, 32670.0, 12824.0, 5686.0, 2784.0, 1598.0, 919.0, 543.0, 381.0, 279.0, 176.0, 121.0, 92.0, 55.0, 39.0, 25.0, 17.0, 9.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01873779296875, -0.01816868782043457, -0.01759958267211914, -0.01703047752380371, -0.01646137237548828, -0.01589226722717285, -0.015323162078857422, -0.014754056930541992, -0.014184951782226562, -0.013615846633911133, -0.013046741485595703, -0.012477636337280273, -0.011908531188964844, -0.011339426040649414, -0.010770320892333984, -0.010201215744018555, -0.009632110595703125, -0.009063005447387695, -0.008493900299072266, -0.007924795150756836, -0.007355690002441406, -0.0067865848541259766, -0.006217479705810547, -0.005648374557495117, -0.0050792694091796875, -0.004510164260864258, -0.003941059112548828, -0.0033719539642333984, -0.0028028488159179688, -0.002233743667602539, -0.0016646385192871094, -0.0010955333709716797, -0.00052642822265625, 4.267692565917969e-05, 0.0006117820739746094, 0.001180887222290039, 0.0017499923706054688, 0.0023190975189208984, 0.002888202667236328, 0.003457307815551758, 0.0040264129638671875, 0.004595518112182617, 0.005164623260498047, 0.0057337284088134766, 0.006302833557128906, 0.006871938705444336, 0.007441043853759766, 0.008010149002075195, 0.008579254150390625, 0.009148359298706055, 0.009717464447021484, 0.010286569595336914, 0.010855674743652344, 0.011424779891967773, 0.011993885040283203, 0.012562990188598633, 0.013132095336914062, 0.013701200485229492, 0.014270305633544922, 0.014839410781860352, 0.015408515930175781, 0.01597762107849121, 0.01654672622680664, 0.01711583137512207, 0.0176849365234375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 10.0, 14.0, 19.0, 18.0, 21.0, 27.0, 25.0, 34.0, 46.0, 56.0, 65.0, 78.0, 86.0, 61.0, 64.0, 41.0, 60.0, 59.0, 41.0, 30.0, 31.0, 31.0, 14.0, 16.0, 9.0, 11.0, 12.0, 5.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -9.046867489814758e-06, -8.795410394668579e-06, -8.5439532995224e-06, -8.29249620437622e-06, -8.041039109230042e-06, -7.789582014083862e-06, -7.538124918937683e-06, -7.286667823791504e-06, -7.035210728645325e-06, -6.7837536334991455e-06, -6.532296538352966e-06, -6.280839443206787e-06, -6.029382348060608e-06, -5.777925252914429e-06, -5.5264681577682495e-06, -5.27501106262207e-06, -5.023553967475891e-06, -4.772096872329712e-06, -4.520639777183533e-06, -4.2691826820373535e-06, -4.017725586891174e-06, -3.766268491744995e-06, -3.514811396598816e-06, -3.2633543014526367e-06, -3.0118972063064575e-06, -2.7604401111602783e-06, -2.508983016014099e-06, -2.25752592086792e-06, -2.0060688257217407e-06, -1.7546117305755615e-06, -1.5031546354293823e-06, -1.2516975402832031e-06, -1.000240445137024e-06, -7.487833499908447e-07, -4.973262548446655e-07, -2.4586915969848633e-07, 5.587935447692871e-09, 2.5704503059387207e-07, 5.085021257400513e-07, 7.599592208862305e-07, 1.0114163160324097e-06, 1.2628734111785889e-06, 1.514330506324768e-06, 1.7657876014709473e-06, 2.0172446966171265e-06, 2.2687017917633057e-06, 2.520158886909485e-06, 2.771615982055664e-06, 3.0230730772018433e-06, 3.2745301723480225e-06, 3.5259872674942017e-06, 3.777444362640381e-06, 4.02890145778656e-06, 4.280358552932739e-06, 4.5318156480789185e-06, 4.783272743225098e-06, 5.034729838371277e-06, 5.286186933517456e-06, 5.537644028663635e-06, 5.7891011238098145e-06, 6.040558218955994e-06, 6.292015314102173e-06, 6.543472409248352e-06, 6.794929504394531e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 13.0, 12.0, 27.0, 26.0, 29.0, 47.0, 58.0, 84.0, 125.0, 306.0, 648.0, 1569.0, 4116.0, 13488.0, 54405.0, 273200.0, 521353.0, 136816.0, 29432.0, 8010.0, 2678.0, 1036.0, 433.0, 237.0, 133.0, 89.0, 53.0, 43.0, 25.0, 19.0, 17.0, 9.0, 3.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0231475830078125, -0.02226710319519043, -0.02138662338256836, -0.02050614356994629, -0.01962566375732422, -0.01874518394470215, -0.017864704132080078, -0.016984224319458008, -0.016103744506835938, -0.015223264694213867, -0.014342784881591797, -0.013462305068969727, -0.012581825256347656, -0.011701345443725586, -0.010820865631103516, -0.009940385818481445, -0.009059906005859375, -0.008179426193237305, -0.007298946380615234, -0.006418466567993164, -0.005537986755371094, -0.0046575069427490234, -0.003777027130126953, -0.002896547317504883, -0.0020160675048828125, -0.0011355876922607422, -0.0002551078796386719, 0.0006253719329833984, 0.0015058517456054688, 0.002386331558227539, 0.0032668113708496094, 0.00414729118347168, 0.00502777099609375, 0.00590825080871582, 0.006788730621337891, 0.007669210433959961, 0.008549690246582031, 0.009430170059204102, 0.010310649871826172, 0.011191129684448242, 0.012071609497070312, 0.012952089309692383, 0.013832569122314453, 0.014713048934936523, 0.015593528747558594, 0.016474008560180664, 0.017354488372802734, 0.018234968185424805, 0.019115447998046875, 0.019995927810668945, 0.020876407623291016, 0.021756887435913086, 0.022637367248535156, 0.023517847061157227, 0.024398326873779297, 0.025278806686401367, 0.026159286499023438, 0.027039766311645508, 0.027920246124267578, 0.02880072593688965, 0.02968120574951172, 0.03056168556213379, 0.03144216537475586, 0.03232264518737793, 0.033203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 11.0, 21.0, 26.0, 45.0, 63.0, 72.0, 90.0, 100.0, 94.0, 103.0, 89.0, 66.0, 59.0, 52.0, 31.0, 12.0, 23.0, 10.0, 4.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204925537109375, -0.019776582717895508, -0.019060611724853516, -0.018344640731811523, -0.01762866973876953, -0.01691269874572754, -0.016196727752685547, -0.015480756759643555, -0.014764785766601562, -0.01404881477355957, -0.013332843780517578, -0.012616872787475586, -0.011900901794433594, -0.011184930801391602, -0.01046895980834961, -0.009752988815307617, -0.009037017822265625, -0.008321046829223633, -0.007605075836181641, -0.0068891048431396484, -0.006173133850097656, -0.005457162857055664, -0.004741191864013672, -0.00402522087097168, -0.0033092498779296875, -0.0025932788848876953, -0.0018773078918457031, -0.001161336898803711, -0.00044536590576171875, 0.00027060508728027344, 0.0009865760803222656, 0.0017025470733642578, 0.00241851806640625, 0.003134489059448242, 0.0038504600524902344, 0.0045664310455322266, 0.005282402038574219, 0.005998373031616211, 0.006714344024658203, 0.007430315017700195, 0.008146286010742188, 0.00886225700378418, 0.009578227996826172, 0.010294198989868164, 0.011010169982910156, 0.011726140975952148, 0.01244211196899414, 0.013158082962036133, 0.013874053955078125, 0.014590024948120117, 0.01530599594116211, 0.0160219669342041, 0.016737937927246094, 0.017453908920288086, 0.018169879913330078, 0.01888585090637207, 0.019601821899414062, 0.020317792892456055, 0.021033763885498047, 0.02174973487854004, 0.02246570587158203, 0.023181676864624023, 0.023897647857666016, 0.024613618850708008, 0.02532958984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 16.0, 33.0, 47.0, 95.0, 159.0, 172.0, 190.0, 129.0, 76.0, 44.0, 24.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14397837221622467, -0.13476581871509552, -0.12555326521396637, -0.11634071916341782, -0.10712817311286926, -0.09791561961174011, -0.08870306611061096, -0.07949052006006241, -0.07027796655893326, -0.061065416783094406, -0.051852867007255554, -0.042640313506126404, -0.03342776373028755, -0.0242152139544487, -0.01500266045331955, -0.005790114402770996, 0.0034224390983581543, 0.01263498980551958, 0.021847540512681007, 0.03106009215116501, 0.04027264192700386, 0.04948519170284271, 0.05869774520397186, 0.06791029125452042, 0.07712284475564957, 0.08633539825677872, 0.09554794430732727, 0.10476049780845642, 0.11397305130958557, 0.12318559736013412, 0.13239815831184387, 0.14161069691181183, 0.15082326531410217, 0.16003581881523132, 0.16924837231636047, 0.17846092581748962, 0.18767346441745758, 0.19688601791858673, 0.20609857141971588, 0.21531111001968384, 0.224523663520813, 0.23373621702194214, 0.2429487705230713, 0.25216132402420044, 0.2613738775253296, 0.27058643102645874, 0.2797989845275879, 0.28901150822639465, 0.2982240915298462, 0.30743664503097534, 0.3166491985321045, 0.32586175203323364, 0.3350743055343628, 0.34428685903549194, 0.3534994125366211, 0.36271193623542786, 0.371924489736557, 0.38113704323768616, 0.3903495967388153, 0.39956215023994446, 0.4087747037410736, 0.41798722743988037, 0.4271997809410095, 0.43641233444213867, 0.4456248879432678]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 6.0, 9.0, 10.0, 12.0, 15.0, 16.0, 21.0, 21.0, 25.0, 19.0, 23.0, 38.0, 19.0, 35.0, 33.0, 41.0, 41.0, 24.0, 29.0, 37.0, 32.0, 39.0, 38.0, 30.0, 33.0, 36.0, 29.0, 27.0, 35.0, 25.0, 26.0, 25.0, 24.0, 22.0, 13.0, 10.0, 11.0, 15.0, 8.0, 11.0, 11.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.15370112657546997, -0.14907239377498627, -0.14444366097450256, -0.13981491327285767, -0.13518618047237396, -0.13055744767189026, -0.12592869997024536, -0.12129996716976166, -0.11667123436927795, -0.11204250156879425, -0.10741376131772995, -0.10278502106666565, -0.09815628826618195, -0.09352755546569824, -0.08889881521463394, -0.08427007496356964, -0.07964134216308594, -0.07501260936260223, -0.07038386911153793, -0.06575512886047363, -0.06112639605998993, -0.05649765953421593, -0.051868923008441925, -0.04724018648266792, -0.04261144995689392, -0.03798271343111992, -0.03335397690534592, -0.028725240379571915, -0.024096503853797913, -0.01946776732802391, -0.014839030802249908, -0.010210294276475906, -0.005581557750701904, -0.0009528212249279022, 0.0036759153008461, 0.008304651826620102, 0.012933388352394104, 0.017562124878168106, 0.022190861403942108, 0.02681959792971611, 0.03144833445549011, 0.036077070981264114, 0.040705807507038116, 0.04533454403281212, 0.04996328055858612, 0.05459201708436012, 0.059220753610134125, 0.06384949386119843, 0.06847822666168213, 0.07310695946216583, 0.07773569971323013, 0.08236443996429443, 0.08699317276477814, 0.09162190556526184, 0.09625064581632614, 0.10087938606739044, 0.10550811886787415, 0.11013685166835785, 0.11476559191942215, 0.11939433217048645, 0.12402306497097015, 0.12865179777145386, 0.13328054547309875, 0.13790927827358246, 0.14253801107406616]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 9.0, 7.0, 11.0, 19.0, 36.0, 67.0, 98.0, 159.0, 293.0, 604.0, 1237.0, 3992.0, 15322.0, 112259.0, 2558642.0, 1423130.0, 62734.0, 10713.0, 3072.0, 962.0, 420.0, 226.0, 115.0, 60.0, 29.0, 22.0, 17.0, 10.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0777587890625, -0.07486629486083984, -0.07197380065917969, -0.06908130645751953, -0.06618881225585938, -0.06329631805419922, -0.06040382385253906, -0.057511329650878906, -0.05461883544921875, -0.051726341247558594, -0.04883384704589844, -0.04594135284423828, -0.043048858642578125, -0.04015636444091797, -0.03726387023925781, -0.034371376037597656, -0.0314788818359375, -0.028586387634277344, -0.025693893432617188, -0.02280139923095703, -0.019908905029296875, -0.01701641082763672, -0.014123916625976562, -0.011231422424316406, -0.00833892822265625, -0.005446434020996094, -0.0025539398193359375, 0.00033855438232421875, 0.003231048583984375, 0.006123542785644531, 0.009016036987304688, 0.011908531188964844, 0.014801025390625, 0.017693519592285156, 0.020586013793945312, 0.02347850799560547, 0.026371002197265625, 0.02926349639892578, 0.03215599060058594, 0.035048484802246094, 0.03794097900390625, 0.040833473205566406, 0.04372596740722656, 0.04661846160888672, 0.049510955810546875, 0.05240345001220703, 0.05529594421386719, 0.058188438415527344, 0.0610809326171875, 0.06397342681884766, 0.06686592102050781, 0.06975841522216797, 0.07265090942382812, 0.07554340362548828, 0.07843589782714844, 0.0813283920288086, 0.08422088623046875, 0.0871133804321289, 0.09000587463378906, 0.09289836883544922, 0.09579086303710938, 0.09868335723876953, 0.10157585144042969, 0.10446834564208984, 0.10736083984375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 10.0, 13.0, 18.0, 34.0, 48.0, 81.0, 101.0, 125.0, 143.0, 104.0, 115.0, 78.0, 49.0, 42.0, 25.0, 10.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09112548828125, -0.08849334716796875, -0.0858612060546875, -0.08322906494140625, -0.080596923828125, -0.07796478271484375, -0.0753326416015625, -0.07270050048828125, -0.070068359375, -0.06743621826171875, -0.0648040771484375, -0.06217193603515625, -0.059539794921875, -0.05690765380859375, -0.0542755126953125, -0.05164337158203125, -0.04901123046875, -0.04637908935546875, -0.0437469482421875, -0.04111480712890625, -0.038482666015625, -0.03585052490234375, -0.0332183837890625, -0.03058624267578125, -0.0279541015625, -0.02532196044921875, -0.0226898193359375, -0.02005767822265625, -0.017425537109375, -0.01479339599609375, -0.0121612548828125, -0.00952911376953125, -0.00689697265625, -0.00426483154296875, -0.0016326904296875, 0.00099945068359375, 0.003631591796875, 0.00626373291015625, 0.0088958740234375, 0.01152801513671875, 0.01416015625, 0.01679229736328125, 0.0194244384765625, 0.02205657958984375, 0.024688720703125, 0.02732086181640625, 0.0299530029296875, 0.03258514404296875, 0.03521728515625, 0.03784942626953125, 0.0404815673828125, 0.04311370849609375, 0.045745849609375, 0.04837799072265625, 0.0510101318359375, 0.05364227294921875, 0.0562744140625, 0.05890655517578125, 0.0615386962890625, 0.06417083740234375, 0.066802978515625, 0.06943511962890625, 0.0720672607421875, 0.07469940185546875, 0.07733154296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 17.0, 21.0, 24.0, 44.0, 55.0, 118.0, 160.0, 263.0, 457.0, 817.0, 1423.0, 2561.0, 4749.0, 9051.0, 18261.0, 38954.0, 89774.0, 240190.0, 866365.0, 1909140.0, 669741.0, 198357.0, 76798.0, 33818.0, 15798.0, 7832.0, 4166.0, 2278.0, 1222.0, 752.0, 398.0, 249.0, 152.0, 105.0, 49.0, 46.0, 15.0, 13.0, 19.0, 7.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0294647216796875, -0.02858281135559082, -0.02770090103149414, -0.02681899070739746, -0.02593708038330078, -0.0250551700592041, -0.024173259735107422, -0.023291349411010742, -0.022409439086914062, -0.021527528762817383, -0.020645618438720703, -0.019763708114624023, -0.018881797790527344, -0.017999887466430664, -0.017117977142333984, -0.016236066818237305, -0.015354156494140625, -0.014472246170043945, -0.013590335845947266, -0.012708425521850586, -0.011826515197753906, -0.010944604873657227, -0.010062694549560547, -0.009180784225463867, -0.008298873901367188, -0.007416963577270508, -0.006535053253173828, -0.0056531429290771484, -0.004771232604980469, -0.003889322280883789, -0.0030074119567871094, -0.0021255016326904297, -0.00124359130859375, -0.0003616809844970703, 0.0005202293395996094, 0.001402139663696289, 0.0022840499877929688, 0.0031659603118896484, 0.004047870635986328, 0.004929780960083008, 0.0058116912841796875, 0.006693601608276367, 0.007575511932373047, 0.008457422256469727, 0.009339332580566406, 0.010221242904663086, 0.011103153228759766, 0.011985063552856445, 0.012866973876953125, 0.013748884201049805, 0.014630794525146484, 0.015512704849243164, 0.016394615173339844, 0.017276525497436523, 0.018158435821533203, 0.019040346145629883, 0.019922256469726562, 0.020804166793823242, 0.021686077117919922, 0.0225679874420166, 0.02344989776611328, 0.02433180809020996, 0.02521371841430664, 0.02609562873840332, 0.0269775390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 4.0, 6.0, 3.0, 5.0, 2.0, 8.0, 11.0, 6.0, 11.0, 14.0, 10.0, 12.0, 15.0, 29.0, 24.0, 47.0, 49.0, 68.0, 84.0, 101.0, 116.0, 184.0, 243.0, 309.0, 379.0, 436.0, 403.0, 338.0, 289.0, 194.0, 144.0, 118.0, 92.0, 63.0, 42.0, 34.0, 27.0, 28.0, 25.0, 11.0, 18.0, 13.0, 13.0, 9.0, 10.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.0303802490234375, -0.02942371368408203, -0.028467178344726562, -0.027510643005371094, -0.026554107666015625, -0.025597572326660156, -0.024641036987304688, -0.02368450164794922, -0.02272796630859375, -0.02177143096923828, -0.020814895629882812, -0.019858360290527344, -0.018901824951171875, -0.017945289611816406, -0.016988754272460938, -0.01603221893310547, -0.01507568359375, -0.014119148254394531, -0.013162612915039062, -0.012206077575683594, -0.011249542236328125, -0.010293006896972656, -0.009336471557617188, -0.008379936218261719, -0.00742340087890625, -0.006466865539550781, -0.0055103302001953125, -0.004553794860839844, -0.003597259521484375, -0.0026407241821289062, -0.0016841888427734375, -0.0007276535034179688, 0.0002288818359375, 0.0011854171752929688, 0.0021419525146484375, 0.0030984878540039062, 0.004055023193359375, 0.005011558532714844, 0.0059680938720703125, 0.006924629211425781, 0.00788116455078125, 0.008837699890136719, 0.009794235229492188, 0.010750770568847656, 0.011707305908203125, 0.012663841247558594, 0.013620376586914062, 0.014576911926269531, 0.015533447265625, 0.01648998260498047, 0.017446517944335938, 0.018403053283691406, 0.019359588623046875, 0.020316123962402344, 0.021272659301757812, 0.02222919464111328, 0.02318572998046875, 0.02414226531982422, 0.025098800659179688, 0.026055335998535156, 0.027011871337890625, 0.027968406677246094, 0.028924942016601562, 0.02988147735595703, 0.0308380126953125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 10.0, 23.0, 34.0, 64.0, 92.0, 163.0, 152.0, 157.0, 117.0, 82.0, 46.0, 23.0, 16.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.404960036277771, -0.39456427097320557, -0.38416847586631775, -0.37377268075942993, -0.3633769154548645, -0.3529811501502991, -0.34258535504341125, -0.33218955993652344, -0.321793794631958, -0.3113980293273926, -0.30100223422050476, -0.29060643911361694, -0.2802106738090515, -0.2698149085044861, -0.25941911339759827, -0.24902333319187164, -0.23862755298614502, -0.2282317727804184, -0.21783599257469177, -0.20744021236896515, -0.19704443216323853, -0.1866486519575119, -0.17625287175178528, -0.16585709154605865, -0.15546131134033203, -0.1450655311346054, -0.13466975092887878, -0.12427397072315216, -0.11387819051742554, -0.10348241031169891, -0.09308663010597229, -0.08269084990024567, -0.07229506969451904, -0.06189928948879242, -0.051503509283065796, -0.04110772907733917, -0.03071194887161255, -0.020316168665885925, -0.009920388460159302, 0.0004753917455673218, 0.010871171951293945, 0.02126695215702057, 0.03166273236274719, 0.042058512568473816, 0.05245429277420044, 0.06285007297992706, 0.07324585318565369, 0.08364163339138031, 0.09403741359710693, 0.10443319380283356, 0.11482897400856018, 0.1252247542142868, 0.13562053442001343, 0.14601631462574005, 0.15641209483146667, 0.1668078750371933, 0.17720365524291992, 0.18759943544864655, 0.19799521565437317, 0.2083909958600998, 0.21878677606582642, 0.22918255627155304, 0.23957833647727966, 0.2499741166830063, 0.2603698968887329]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 8.0, 10.0, 13.0, 9.0, 11.0, 27.0, 31.0, 19.0, 40.0, 25.0, 37.0, 48.0, 57.0, 52.0, 50.0, 52.0, 54.0, 43.0, 48.0, 44.0, 39.0, 35.0, 31.0, 34.0, 26.0, 25.0, 22.0, 16.0, 21.0, 12.0, 10.0, 6.0, 7.0, 3.0, 9.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15037477016448975, -0.14538130164146423, -0.14038784801959991, -0.1353943794965744, -0.13040092587471008, -0.12540745735168457, -0.12041399627923965, -0.11542053520679474, -0.11042707413434982, -0.10543361306190491, -0.10044015198945999, -0.09544669091701508, -0.09045322239398956, -0.08545976877212524, -0.08046630024909973, -0.07547283917665482, -0.0704793781042099, -0.06548591703176498, -0.06049245595932007, -0.055498991161584854, -0.05050553008913994, -0.04551206901669502, -0.04051860421895981, -0.03552514314651489, -0.030531682074069977, -0.02553822100162506, -0.020544758066534996, -0.015551296062767506, -0.010557834059000015, -0.0055643729865550995, -0.0005709100514650345, 0.0044225528836250305, 0.009416013956069946, 0.014409475959837437, 0.019402937963604927, 0.024396400898694992, 0.029389861971139908, 0.034383323043584824, 0.03937678784132004, 0.044370248913764954, 0.04936370998620987, 0.054357171058654785, 0.0593506321310997, 0.06434409320354462, 0.06933756172657013, 0.07433101534843445, 0.07932448387145996, 0.08431794494390488, 0.08931140601634979, 0.09430486708879471, 0.09929832816123962, 0.10429178923368454, 0.10928525030612946, 0.11427871882915497, 0.11927217990159988, 0.1242656409740448, 0.1292591094970703, 0.13425257802009583, 0.13924603164196014, 0.14423950016498566, 0.14923295378684998, 0.1542264223098755, 0.1592198759317398, 0.16421334445476532, 0.16920679807662964]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 11.0, 13.0, 12.0, 25.0, 35.0, 51.0, 62.0, 78.0, 114.0, 163.0, 270.0, 417.0, 713.0, 1444.0, 3394.0, 9181.0, 29230.0, 108000.0, 393421.0, 363885.0, 96667.0, 26510.0, 8451.0, 3150.0, 1348.0, 678.0, 391.0, 252.0, 159.0, 106.0, 88.0, 46.0, 62.0, 30.0, 19.0, 19.0, 16.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06623458862304688, -0.06386566162109375, -0.061496734619140625, -0.0591278076171875, -0.056758880615234375, -0.05438995361328125, -0.052021026611328125, -0.049652099609375, -0.047283172607421875, -0.04491424560546875, -0.042545318603515625, -0.0401763916015625, -0.037807464599609375, -0.03543853759765625, -0.033069610595703125, -0.03070068359375, -0.028331756591796875, -0.02596282958984375, -0.023593902587890625, -0.0212249755859375, -0.018856048583984375, -0.01648712158203125, -0.014118194580078125, -0.011749267578125, -0.009380340576171875, -0.00701141357421875, -0.004642486572265625, -0.0022735595703125, 9.5367431640625e-05, 0.00246429443359375, 0.004833221435546875, 0.0072021484375, 0.009571075439453125, 0.01194000244140625, 0.014308929443359375, 0.0166778564453125, 0.019046783447265625, 0.02141571044921875, 0.023784637451171875, 0.026153564453125, 0.028522491455078125, 0.03089141845703125, 0.033260345458984375, 0.0356292724609375, 0.037998199462890625, 0.04036712646484375, 0.042736053466796875, 0.04510498046875, 0.047473907470703125, 0.04984283447265625, 0.052211761474609375, 0.0545806884765625, 0.056949615478515625, 0.05931854248046875, 0.061687469482421875, 0.064056396484375, 0.06642532348632812, 0.06879425048828125, 0.07116317749023438, 0.0735321044921875, 0.07590103149414062, 0.07826995849609375, 0.08063888549804688, 0.0830078125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 13.0, 33.0, 46.0, 76.0, 100.0, 132.0, 148.0, 149.0, 109.0, 76.0, 57.0, 34.0, 9.0, 10.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.100830078125, -0.09799766540527344, -0.09516525268554688, -0.09233283996582031, -0.08950042724609375, -0.08666801452636719, -0.08383560180664062, -0.08100318908691406, -0.0781707763671875, -0.07533836364746094, -0.07250595092773438, -0.06967353820800781, -0.06684112548828125, -0.06400871276855469, -0.061176300048828125, -0.05834388732910156, -0.055511474609375, -0.05267906188964844, -0.049846649169921875, -0.04701423645019531, -0.04418182373046875, -0.04134941101074219, -0.038516998291015625, -0.03568458557128906, -0.0328521728515625, -0.030019760131835938, -0.027187347412109375, -0.024354934692382812, -0.02152252197265625, -0.018690109252929688, -0.015857696533203125, -0.013025283813476562, -0.01019287109375, -0.0073604583740234375, -0.004528045654296875, -0.0016956329345703125, 0.00113677978515625, 0.0039691925048828125, 0.006801605224609375, 0.009634017944335938, 0.0124664306640625, 0.015298843383789062, 0.018131256103515625, 0.020963668823242188, 0.02379608154296875, 0.026628494262695312, 0.029460906982421875, 0.03229331970214844, 0.035125732421875, 0.03795814514160156, 0.040790557861328125, 0.04362297058105469, 0.04645538330078125, 0.04928779602050781, 0.052120208740234375, 0.05495262145996094, 0.0577850341796875, 0.06061744689941406, 0.06344985961914062, 0.06628227233886719, 0.06911468505859375, 0.07194709777832031, 0.07477951049804688, 0.07761192321777344, 0.0804443359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 13.0, 11.0, 29.0, 32.0, 48.0, 71.0, 98.0, 156.0, 230.0, 376.0, 756.0, 1417.0, 3014.0, 7447.0, 19253.0, 54556.0, 166748.0, 399657.0, 260196.0, 85541.0, 29312.0, 10887.0, 4427.0, 2046.0, 912.0, 512.0, 262.0, 171.0, 108.0, 62.0, 52.0, 46.0, 22.0, 23.0, 15.0, 10.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04901123046875, -0.04730367660522461, -0.04559612274169922, -0.04388856887817383, -0.04218101501464844, -0.04047346115112305, -0.038765907287597656, -0.037058353424072266, -0.035350799560546875, -0.033643245697021484, -0.031935691833496094, -0.030228137969970703, -0.028520584106445312, -0.026813030242919922, -0.02510547637939453, -0.02339792251586914, -0.02169036865234375, -0.01998281478881836, -0.01827526092529297, -0.016567707061767578, -0.014860153198242188, -0.013152599334716797, -0.011445045471191406, -0.009737491607666016, -0.008029937744140625, -0.006322383880615234, -0.004614830017089844, -0.002907276153564453, -0.0011997222900390625, 0.0005078315734863281, 0.0022153854370117188, 0.003922939300537109, 0.0056304931640625, 0.007338047027587891, 0.009045600891113281, 0.010753154754638672, 0.012460708618164062, 0.014168262481689453, 0.015875816345214844, 0.017583370208740234, 0.019290924072265625, 0.020998477935791016, 0.022706031799316406, 0.024413585662841797, 0.026121139526367188, 0.027828693389892578, 0.02953624725341797, 0.03124380111694336, 0.03295135498046875, 0.03465890884399414, 0.03636646270751953, 0.03807401657104492, 0.03978157043457031, 0.0414891242980957, 0.043196678161621094, 0.044904232025146484, 0.046611785888671875, 0.048319339752197266, 0.050026893615722656, 0.05173444747924805, 0.05344200134277344, 0.05514955520629883, 0.05685710906982422, 0.05856466293334961, 0.060272216796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 7.0, 3.0, 9.0, 13.0, 13.0, 17.0, 19.0, 24.0, 39.0, 46.0, 45.0, 39.0, 54.0, 57.0, 56.0, 60.0, 53.0, 52.0, 47.0, 56.0, 49.0, 44.0, 32.0, 26.0, 25.0, 29.0, 23.0, 10.0, 8.0, 12.0, 8.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08526611328125, -0.08250713348388672, -0.07974815368652344, -0.07698917388916016, -0.07423019409179688, -0.0714712142944336, -0.06871223449707031, -0.06595325469970703, -0.06319427490234375, -0.06043529510498047, -0.05767631530761719, -0.054917335510253906, -0.052158355712890625, -0.049399375915527344, -0.04664039611816406, -0.04388141632080078, -0.0411224365234375, -0.03836345672607422, -0.03560447692871094, -0.032845497131347656, -0.030086517333984375, -0.027327537536621094, -0.024568557739257812, -0.02180957794189453, -0.01905059814453125, -0.01629161834716797, -0.013532638549804688, -0.010773658752441406, -0.008014678955078125, -0.005255699157714844, -0.0024967193603515625, 0.00026226043701171875, 0.003021240234375, 0.005780220031738281, 0.008539199829101562, 0.011298179626464844, 0.014057159423828125, 0.016816139221191406, 0.019575119018554688, 0.02233409881591797, 0.02509307861328125, 0.02785205841064453, 0.030611038208007812, 0.033370018005371094, 0.036128997802734375, 0.038887977600097656, 0.04164695739746094, 0.04440593719482422, 0.0471649169921875, 0.04992389678955078, 0.05268287658691406, 0.055441856384277344, 0.058200836181640625, 0.060959815979003906, 0.06371879577636719, 0.06647777557373047, 0.06923675537109375, 0.07199573516845703, 0.07475471496582031, 0.0775136947631836, 0.08027267456054688, 0.08303165435791016, 0.08579063415527344, 0.08854961395263672, 0.09130859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 19.0, 25.0, 35.0, 60.0, 103.0, 174.0, 314.0, 642.0, 1301.0, 2798.0, 6553.0, 15506.0, 39503.0, 107172.0, 292836.0, 350948.0, 144310.0, 51410.0, 19896.0, 8103.0, 3550.0, 1613.0, 788.0, 377.0, 200.0, 110.0, 67.0, 47.0, 27.0, 13.0, 14.0, 8.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019012451171875, -0.01845550537109375, -0.0178985595703125, -0.01734161376953125, -0.01678466796875, -0.01622772216796875, -0.0156707763671875, -0.01511383056640625, -0.014556884765625, -0.01399993896484375, -0.0134429931640625, -0.01288604736328125, -0.0123291015625, -0.01177215576171875, -0.0112152099609375, -0.01065826416015625, -0.010101318359375, -0.00954437255859375, -0.0089874267578125, -0.00843048095703125, -0.00787353515625, -0.00731658935546875, -0.0067596435546875, -0.00620269775390625, -0.005645751953125, -0.00508880615234375, -0.0045318603515625, -0.00397491455078125, -0.00341796875, -0.00286102294921875, -0.0023040771484375, -0.00174713134765625, -0.001190185546875, -0.00063323974609375, -7.62939453125e-05, 0.00048065185546875, 0.00103759765625, 0.00159454345703125, 0.0021514892578125, 0.00270843505859375, 0.003265380859375, 0.00382232666015625, 0.0043792724609375, 0.00493621826171875, 0.0054931640625, 0.00605010986328125, 0.0066070556640625, 0.00716400146484375, 0.007720947265625, 0.00827789306640625, 0.0088348388671875, 0.00939178466796875, 0.00994873046875, 0.01050567626953125, 0.0110626220703125, 0.01161956787109375, 0.012176513671875, 0.01273345947265625, 0.0132904052734375, 0.01384735107421875, 0.014404296875, 0.01496124267578125, 0.0155181884765625, 0.01607513427734375, 0.016632080078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 10.0, 7.0, 12.0, 14.0, 22.0, 32.0, 55.0, 50.0, 69.0, 106.0, 80.0, 99.0, 90.0, 90.0, 51.0, 44.0, 36.0, 34.0, 23.0, 15.0, 11.0, 3.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138448715209961e-05, -1.1050142347812653e-05, -1.0715797543525696e-05, -1.0381452739238739e-05, -1.0047107934951782e-05, -9.712763130664825e-06, -9.378418326377869e-06, -9.044073522090912e-06, -8.709728717803955e-06, -8.375383913516998e-06, -8.041039109230042e-06, -7.706694304943085e-06, -7.372349500656128e-06, -7.038004696369171e-06, -6.703659892082214e-06, -6.3693150877952576e-06, -6.034970283508301e-06, -5.700625479221344e-06, -5.366280674934387e-06, -5.03193587064743e-06, -4.697591066360474e-06, -4.363246262073517e-06, -4.02890145778656e-06, -3.6945566534996033e-06, -3.3602118492126465e-06, -3.0258670449256897e-06, -2.691522240638733e-06, -2.357177436351776e-06, -2.0228326320648193e-06, -1.6884878277778625e-06, -1.3541430234909058e-06, -1.019798219203949e-06, -6.854534149169922e-07, -3.511086106300354e-07, -1.6763806343078613e-08, 3.175809979438782e-07, 6.51925802230835e-07, 9.862706065177917e-07, 1.3206154108047485e-06, 1.6549602150917053e-06, 1.989305019378662e-06, 2.323649823665619e-06, 2.6579946279525757e-06, 2.9923394322395325e-06, 3.3266842365264893e-06, 3.661029040813446e-06, 3.995373845100403e-06, 4.32971864938736e-06, 4.664063453674316e-06, 4.998408257961273e-06, 5.33275306224823e-06, 5.667097866535187e-06, 6.0014426708221436e-06, 6.3357874751091e-06, 6.670132279396057e-06, 7.004477083683014e-06, 7.338821887969971e-06, 7.673166692256927e-06, 8.007511496543884e-06, 8.341856300830841e-06, 8.676201105117798e-06, 9.010545909404755e-06, 9.344890713691711e-06, 9.679235517978668e-06, 1.0013580322265625e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 9.0, 9.0, 11.0, 29.0, 41.0, 46.0, 73.0, 83.0, 161.0, 254.0, 466.0, 934.0, 1726.0, 3468.0, 7000.0, 14656.0, 32842.0, 78309.0, 183682.0, 306706.0, 232483.0, 104999.0, 43721.0, 18927.0, 8804.0, 4317.0, 2163.0, 1116.0, 624.0, 365.0, 185.0, 110.0, 70.0, 48.0, 34.0, 22.0, 14.0, 12.0, 9.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.016998291015625, -0.016521692276000977, -0.016045093536376953, -0.01556849479675293, -0.015091896057128906, -0.014615297317504883, -0.01413869857788086, -0.013662099838256836, -0.013185501098632812, -0.012708902359008789, -0.012232303619384766, -0.011755704879760742, -0.011279106140136719, -0.010802507400512695, -0.010325908660888672, -0.009849309921264648, -0.009372711181640625, -0.008896112442016602, -0.008419513702392578, -0.007942914962768555, -0.007466316223144531, -0.006989717483520508, -0.006513118743896484, -0.006036520004272461, -0.0055599212646484375, -0.005083322525024414, -0.004606723785400391, -0.004130125045776367, -0.0036535263061523438, -0.0031769275665283203, -0.002700328826904297, -0.0022237300872802734, -0.00174713134765625, -0.0012705326080322266, -0.0007939338684082031, -0.0003173351287841797, 0.00015926361083984375, 0.0006358623504638672, 0.0011124610900878906, 0.001589059829711914, 0.0020656585693359375, 0.002542257308959961, 0.0030188560485839844, 0.003495454788208008, 0.003972053527832031, 0.004448652267456055, 0.004925251007080078, 0.0054018497467041016, 0.005878448486328125, 0.0063550472259521484, 0.006831645965576172, 0.007308244705200195, 0.007784843444824219, 0.008261442184448242, 0.008738040924072266, 0.009214639663696289, 0.009691238403320312, 0.010167837142944336, 0.01064443588256836, 0.011121034622192383, 0.011597633361816406, 0.01207423210144043, 0.012550830841064453, 0.013027429580688477, 0.0135040283203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 11.0, 11.0, 18.0, 21.0, 29.0, 34.0, 44.0, 62.0, 68.0, 72.0, 76.0, 88.0, 69.0, 65.0, 79.0, 61.0, 37.0, 36.0, 26.0, 22.0, 12.0, 12.0, 12.0, 7.0, 10.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0206451416015625, -0.020056962966918945, -0.01946878433227539, -0.018880605697631836, -0.01829242706298828, -0.017704248428344727, -0.017116069793701172, -0.016527891159057617, -0.015939712524414062, -0.015351533889770508, -0.014763355255126953, -0.014175176620483398, -0.013586997985839844, -0.012998819351196289, -0.012410640716552734, -0.01182246208190918, -0.011234283447265625, -0.01064610481262207, -0.010057926177978516, -0.009469747543334961, -0.008881568908691406, -0.008293390274047852, -0.007705211639404297, -0.007117033004760742, -0.0065288543701171875, -0.005940675735473633, -0.005352497100830078, -0.0047643184661865234, -0.004176139831542969, -0.003587961196899414, -0.0029997825622558594, -0.0024116039276123047, -0.00182342529296875, -0.0012352466583251953, -0.0006470680236816406, -5.888938903808594e-05, 0.0005292892456054688, 0.0011174678802490234, 0.0017056465148925781, 0.002293825149536133, 0.0028820037841796875, 0.003470182418823242, 0.004058361053466797, 0.0046465396881103516, 0.005234718322753906, 0.005822896957397461, 0.006411075592041016, 0.00699925422668457, 0.007587432861328125, 0.00817561149597168, 0.008763790130615234, 0.009351968765258789, 0.009940147399902344, 0.010528326034545898, 0.011116504669189453, 0.011704683303833008, 0.012292861938476562, 0.012881040573120117, 0.013469219207763672, 0.014057397842407227, 0.014645576477050781, 0.015233755111694336, 0.01582193374633789, 0.016410112380981445, 0.016998291015625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 34.0, 70.0, 113.0, 130.0, 176.0, 144.0, 124.0, 90.0, 53.0, 27.0, 10.0, 4.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32812750339508057, -0.31812193989753723, -0.3081164062023163, -0.29811084270477295, -0.288105309009552, -0.27809974551200867, -0.26809418201446533, -0.2580886483192444, -0.24808308482170105, -0.2380775362253189, -0.22807198762893677, -0.21806642413139343, -0.2080608755350113, -0.19805532693862915, -0.18804976344108582, -0.17804421484470367, -0.16803866624832153, -0.1580331176519394, -0.14802756905555725, -0.13802200555801392, -0.12801645696163177, -0.11801090836524963, -0.1080053523182869, -0.09799979627132416, -0.08799424767494202, -0.07798869907855988, -0.06798314303159714, -0.0579775907099247, -0.04797203838825226, -0.03796648606657982, -0.02796093374490738, -0.01795537769794464, -0.0079498291015625, 0.0020557232201099396, 0.01206127554178238, 0.02206682786345482, 0.03207238018512726, 0.0420779325067997, 0.05208348482847214, 0.062089040875434875, 0.07209458947181702, 0.08210013806819916, 0.0921056941151619, 0.10211125016212463, 0.11211679875850677, 0.12212234735488892, 0.13212791085243225, 0.1421334594488144, 0.15213900804519653, 0.16214455664157867, 0.17215010523796082, 0.18215566873550415, 0.1921612173318863, 0.20216676592826843, 0.21217232942581177, 0.2221778780221939, 0.23218342661857605, 0.2421889752149582, 0.25219452381134033, 0.26220008730888367, 0.272205650806427, 0.28221118450164795, 0.2922167479991913, 0.3022223114967346, 0.31222784519195557]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 10.0, 5.0, 18.0, 15.0, 11.0, 16.0, 11.0, 23.0, 27.0, 21.0, 28.0, 35.0, 43.0, 36.0, 45.0, 34.0, 48.0, 41.0, 50.0, 41.0, 42.0, 47.0, 39.0, 46.0, 32.0, 30.0, 29.0, 25.0, 17.0, 21.0, 16.0, 18.0, 17.0, 18.0, 7.0, 9.0, 6.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.16635072231292725, -0.16050544381141663, -0.1546601504087448, -0.148814857006073, -0.14296957850456238, -0.13712430000305176, -0.13127900660037994, -0.12543371319770813, -0.11958843469619751, -0.11374314874410629, -0.10789786279201508, -0.10205257683992386, -0.09620729088783264, -0.09036200493574142, -0.08451671898365021, -0.07867143303155899, -0.07282614707946777, -0.06698086112737656, -0.06113557517528534, -0.05529028922319412, -0.049445003271102905, -0.04359971731901169, -0.03775443136692047, -0.031909145414829254, -0.026063859462738037, -0.02021857351064682, -0.014373287558555603, -0.008528001606464386, -0.002682715654373169, 0.003162570297718048, 0.009007856249809265, 0.014853142201900482, 0.0206984281539917, 0.026543714106082916, 0.03238900005817413, 0.03823428601026535, 0.04407957196235657, 0.049924857914447784, 0.055770143866539, 0.06161542981863022, 0.06746071577072144, 0.07330600172281265, 0.07915128767490387, 0.08499657362699509, 0.0908418595790863, 0.09668714553117752, 0.10253243148326874, 0.10837771743535995, 0.11422300338745117, 0.12006828933954239, 0.1259135752916336, 0.13175886869430542, 0.13760414719581604, 0.14344942569732666, 0.14929471909999847, 0.1551400125026703, 0.1609852910041809, 0.16683056950569153, 0.17267586290836334, 0.17852115631103516, 0.18436643481254578, 0.1902117133140564, 0.1960570067167282, 0.20190230011940002, 0.20774757862091064]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 16.0, 22.0, 44.0, 65.0, 127.0, 218.0, 423.0, 835.0, 1849.0, 6709.0, 29624.0, 395881.0, 3366860.0, 354780.0, 27523.0, 5998.0, 1885.0, 661.0, 337.0, 155.0, 102.0, 62.0, 33.0, 21.0, 13.0, 2.0, 1.0, 6.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0927734375, -0.08982658386230469, -0.08687973022460938, -0.08393287658691406, -0.08098602294921875, -0.07803916931152344, -0.07509231567382812, -0.07214546203613281, -0.0691986083984375, -0.06625175476074219, -0.06330490112304688, -0.06035804748535156, -0.05741119384765625, -0.05446434020996094, -0.051517486572265625, -0.04857063293457031, -0.045623779296875, -0.04267692565917969, -0.039730072021484375, -0.03678321838378906, -0.03383636474609375, -0.030889511108398438, -0.027942657470703125, -0.024995803833007812, -0.0220489501953125, -0.019102096557617188, -0.016155242919921875, -0.013208389282226562, -0.01026153564453125, -0.0073146820068359375, -0.004367828369140625, -0.0014209747314453125, 0.00152587890625, 0.0044727325439453125, 0.007419586181640625, 0.010366439819335938, 0.01331329345703125, 0.016260147094726562, 0.019207000732421875, 0.022153854370117188, 0.0251007080078125, 0.028047561645507812, 0.030994415283203125, 0.03394126892089844, 0.03688812255859375, 0.03983497619628906, 0.042781829833984375, 0.04572868347167969, 0.048675537109375, 0.05162239074707031, 0.054569244384765625, 0.05751609802246094, 0.06046295166015625, 0.06340980529785156, 0.06635665893554688, 0.06930351257324219, 0.0722503662109375, 0.07519721984863281, 0.07814407348632812, 0.08109092712402344, 0.08403778076171875, 0.08698463439941406, 0.08993148803710938, 0.09287834167480469, 0.0958251953125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 13.0, 26.0, 51.0, 66.0, 101.0, 135.0, 148.0, 126.0, 106.0, 89.0, 62.0, 37.0, 21.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09375, -0.0910491943359375, -0.088348388671875, -0.0856475830078125, -0.08294677734375, -0.0802459716796875, -0.077545166015625, -0.0748443603515625, -0.0721435546875, -0.0694427490234375, -0.066741943359375, -0.0640411376953125, -0.06134033203125, -0.0586395263671875, -0.055938720703125, -0.0532379150390625, -0.050537109375, -0.0478363037109375, -0.045135498046875, -0.0424346923828125, -0.03973388671875, -0.0370330810546875, -0.034332275390625, -0.0316314697265625, -0.0289306640625, -0.0262298583984375, -0.023529052734375, -0.0208282470703125, -0.01812744140625, -0.0154266357421875, -0.012725830078125, -0.0100250244140625, -0.00732421875, -0.0046234130859375, -0.001922607421875, 0.0007781982421875, 0.00347900390625, 0.0061798095703125, 0.008880615234375, 0.0115814208984375, 0.0142822265625, 0.0169830322265625, 0.019683837890625, 0.0223846435546875, 0.02508544921875, 0.0277862548828125, 0.030487060546875, 0.0331878662109375, 0.035888671875, 0.0385894775390625, 0.041290283203125, 0.0439910888671875, 0.04669189453125, 0.0493927001953125, 0.052093505859375, 0.0547943115234375, 0.0574951171875, 0.0601959228515625, 0.062896728515625, 0.0655975341796875, 0.06829833984375, 0.0709991455078125, 0.073699951171875, 0.0764007568359375, 0.0791015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 10.0, 12.0, 26.0, 52.0, 41.0, 82.0, 118.0, 211.0, 400.0, 730.0, 1450.0, 3400.0, 8174.0, 22435.0, 71331.0, 281144.0, 1801319.0, 1642489.0, 258565.0, 66599.0, 21483.0, 7900.0, 3215.0, 1473.0, 681.0, 391.0, 210.0, 125.0, 67.0, 57.0, 39.0, 24.0, 11.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041961669921875, -0.040561676025390625, -0.03916168212890625, -0.037761688232421875, -0.0363616943359375, -0.034961700439453125, -0.03356170654296875, -0.032161712646484375, -0.03076171875, -0.029361724853515625, -0.02796173095703125, -0.026561737060546875, -0.0251617431640625, -0.023761749267578125, -0.02236175537109375, -0.020961761474609375, -0.019561767578125, -0.018161773681640625, -0.01676177978515625, -0.015361785888671875, -0.0139617919921875, -0.012561798095703125, -0.01116180419921875, -0.009761810302734375, -0.00836181640625, -0.006961822509765625, -0.00556182861328125, -0.004161834716796875, -0.0027618408203125, -0.001361846923828125, 3.814697265625e-05, 0.001438140869140625, 0.002838134765625, 0.004238128662109375, 0.00563812255859375, 0.007038116455078125, 0.0084381103515625, 0.009838104248046875, 0.01123809814453125, 0.012638092041015625, 0.0140380859375, 0.015438079833984375, 0.01683807373046875, 0.018238067626953125, 0.0196380615234375, 0.021038055419921875, 0.02243804931640625, 0.023838043212890625, 0.025238037109375, 0.026638031005859375, 0.02803802490234375, 0.029438018798828125, 0.0308380126953125, 0.032238006591796875, 0.03363800048828125, 0.035037994384765625, 0.03643798828125, 0.037837982177734375, 0.03923797607421875, 0.040637969970703125, 0.0420379638671875, 0.043437957763671875, 0.04483795166015625, 0.046237945556640625, 0.047637939453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 8.0, 10.0, 10.0, 17.0, 24.0, 35.0, 38.0, 47.0, 84.0, 123.0, 171.0, 284.0, 483.0, 610.0, 618.0, 490.0, 315.0, 202.0, 142.0, 83.0, 69.0, 53.0, 36.0, 22.0, 27.0, 18.0, 9.0, 8.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.046234130859375, -0.044701576232910156, -0.04316902160644531, -0.04163646697998047, -0.040103912353515625, -0.03857135772705078, -0.03703880310058594, -0.035506248474121094, -0.03397369384765625, -0.032441139221191406, -0.030908584594726562, -0.02937602996826172, -0.027843475341796875, -0.02631092071533203, -0.024778366088867188, -0.023245811462402344, -0.0217132568359375, -0.020180702209472656, -0.018648147583007812, -0.01711559295654297, -0.015583038330078125, -0.014050483703613281, -0.012517929077148438, -0.010985374450683594, -0.00945281982421875, -0.007920265197753906, -0.0063877105712890625, -0.004855155944824219, -0.003322601318359375, -0.0017900466918945312, -0.0002574920654296875, 0.0012750625610351562, 0.0028076171875, 0.004340171813964844, 0.0058727264404296875, 0.007405281066894531, 0.008937835693359375, 0.010470390319824219, 0.012002944946289062, 0.013535499572753906, 0.01506805419921875, 0.016600608825683594, 0.018133163452148438, 0.01966571807861328, 0.021198272705078125, 0.02273082733154297, 0.024263381958007812, 0.025795936584472656, 0.0273284912109375, 0.028861045837402344, 0.030393600463867188, 0.03192615509033203, 0.033458709716796875, 0.03499126434326172, 0.03652381896972656, 0.038056373596191406, 0.03958892822265625, 0.041121482849121094, 0.04265403747558594, 0.04418659210205078, 0.045719146728515625, 0.04725170135498047, 0.04878425598144531, 0.050316810607910156, 0.051849365234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 17.0, 41.0, 127.0, 240.0, 249.0, 191.0, 88.0, 31.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.9638176560401917, -0.9446650147438049, -0.9255123138427734, -0.9063596725463867, -0.8872069716453552, -0.8680543303489685, -0.848901629447937, -0.8297489881515503, -0.8105963468551636, -0.7914437055587769, -0.7722910046577454, -0.7531383633613586, -0.7339856624603271, -0.7148330211639404, -0.6956803202629089, -0.6765276789665222, -0.6573749780654907, -0.638222336769104, -0.6190696358680725, -0.5999169945716858, -0.5807642936706543, -0.5616116523742676, -0.5424589514732361, -0.5233063101768494, -0.5041536092758179, -0.48500093817710876, -0.46584826707839966, -0.44669559597969055, -0.42754292488098145, -0.4083902835845947, -0.3892376124858856, -0.3700849413871765, -0.3509323000907898, -0.3317796289920807, -0.3126269578933716, -0.2934742867946625, -0.27432161569595337, -0.25516897439956665, -0.23601630330085754, -0.21686363220214844, -0.19771096110343933, -0.17855829000473022, -0.15940561890602112, -0.1402529627084732, -0.1211002916097641, -0.10194762051105499, -0.08279495686292648, -0.06364229321479797, -0.04448962211608887, -0.02533695474267006, -0.006184287369251251, 0.012968380004167557, 0.032121047377586365, 0.05127371847629547, 0.07042638212442398, 0.08957904577255249, 0.1087317168712616, 0.1278843879699707, 0.1470370590686798, 0.16618971526622772, 0.18534238636493683, 0.20449505746364594, 0.22364771366119385, 0.24280038475990295, 0.26195305585861206]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 12.0, 14.0, 19.0, 18.0, 17.0, 16.0, 22.0, 20.0, 29.0, 33.0, 43.0, 28.0, 43.0, 43.0, 38.0, 36.0, 38.0, 46.0, 34.0, 38.0, 28.0, 33.0, 42.0, 29.0, 27.0, 30.0, 33.0, 24.0, 16.0, 21.0, 20.0, 18.0, 13.0, 8.0, 11.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1492345929145813, -0.14481954276561737, -0.14040449261665344, -0.13598942756652832, -0.1315743774175644, -0.12715932726860046, -0.12274427711963654, -0.11832922697067261, -0.11391416937112808, -0.10949911922216415, -0.10508406162261963, -0.1006690114736557, -0.09625396132469177, -0.09183890372514725, -0.08742385357618332, -0.0830087959766388, -0.07859374582767487, -0.07417869567871094, -0.06976363807916641, -0.06534858793020248, -0.06093353405594826, -0.05651848018169403, -0.0521034300327301, -0.047688376158475876, -0.04327332228422165, -0.03885826840996742, -0.034443214535713196, -0.030028164386749268, -0.02561311051249504, -0.021198056638240814, -0.016783004626631737, -0.01236795261502266, -0.007952898740768433, -0.0035378457978367805, 0.0008772071450948715, 0.005292260088026524, 0.009707313030958176, 0.014122366905212402, 0.01853741891682148, 0.022952470928430557, 0.027367524802684784, 0.03178257867693901, 0.03619763255119324, 0.040612682700157166, 0.04502773657441139, 0.04944279044866562, 0.05385784059762955, 0.058272894471883774, 0.062687948346138, 0.06710299849510193, 0.07151805609464645, 0.07593310624361038, 0.08034816384315491, 0.08476321399211884, 0.08917826414108276, 0.09359331429004669, 0.09800837188959122, 0.10242342203855515, 0.10683847963809967, 0.1112535297870636, 0.11566857993602753, 0.12008363753557205, 0.12449868768453598, 0.1289137452840805, 0.13332879543304443]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 13.0, 9.0, 13.0, 25.0, 38.0, 41.0, 71.0, 106.0, 185.0, 254.0, 401.0, 756.0, 1344.0, 2852.0, 7129.0, 20451.0, 62449.0, 229293.0, 474466.0, 171788.0, 49630.0, 16077.0, 5767.0, 2468.0, 1198.0, 649.0, 394.0, 232.0, 128.0, 95.0, 64.0, 47.0, 26.0, 29.0, 24.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07215023040771484, -0.06977653503417969, -0.06740283966064453, -0.06502914428710938, -0.06265544891357422, -0.06028175354003906, -0.057908058166503906, -0.05553436279296875, -0.053160667419433594, -0.05078697204589844, -0.04841327667236328, -0.046039581298828125, -0.04366588592529297, -0.04129219055175781, -0.038918495178222656, -0.0365447998046875, -0.034171104431152344, -0.03179740905761719, -0.02942371368408203, -0.027050018310546875, -0.02467632293701172, -0.022302627563476562, -0.019928932189941406, -0.01755523681640625, -0.015181541442871094, -0.012807846069335938, -0.010434150695800781, -0.008060455322265625, -0.005686759948730469, -0.0033130645751953125, -0.0009393692016601562, 0.001434326171875, 0.0038080215454101562, 0.0061817169189453125, 0.008555412292480469, 0.010929107666015625, 0.013302803039550781, 0.015676498413085938, 0.018050193786621094, 0.02042388916015625, 0.022797584533691406, 0.025171279907226562, 0.02754497528076172, 0.029918670654296875, 0.03229236602783203, 0.03466606140136719, 0.037039756774902344, 0.0394134521484375, 0.041787147521972656, 0.04416084289550781, 0.04653453826904297, 0.048908233642578125, 0.05128192901611328, 0.05365562438964844, 0.056029319763183594, 0.05840301513671875, 0.060776710510253906, 0.06315040588378906, 0.06552410125732422, 0.06789779663085938, 0.07027149200439453, 0.07264518737792969, 0.07501888275146484, 0.077392578125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 19.0, 39.0, 51.0, 72.0, 90.0, 139.0, 130.0, 115.0, 133.0, 87.0, 52.0, 35.0, 20.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0904541015625, -0.08783817291259766, -0.08522224426269531, -0.08260631561279297, -0.07999038696289062, -0.07737445831298828, -0.07475852966308594, -0.0721426010131836, -0.06952667236328125, -0.0669107437133789, -0.06429481506347656, -0.06167888641357422, -0.059062957763671875, -0.05644702911376953, -0.05383110046386719, -0.051215171813964844, -0.0485992431640625, -0.045983314514160156, -0.04336738586425781, -0.04075145721435547, -0.038135528564453125, -0.03551959991455078, -0.03290367126464844, -0.030287742614746094, -0.02767181396484375, -0.025055885314941406, -0.022439956665039062, -0.01982402801513672, -0.017208099365234375, -0.014592170715332031, -0.011976242065429688, -0.009360313415527344, -0.006744384765625, -0.004128456115722656, -0.0015125274658203125, 0.0011034011840820312, 0.003719329833984375, 0.006335258483886719, 0.008951187133789062, 0.011567115783691406, 0.01418304443359375, 0.016798973083496094, 0.019414901733398438, 0.02203083038330078, 0.024646759033203125, 0.02726268768310547, 0.029878616333007812, 0.032494544982910156, 0.0351104736328125, 0.037726402282714844, 0.04034233093261719, 0.04295825958251953, 0.045574188232421875, 0.04819011688232422, 0.05080604553222656, 0.053421974182128906, 0.05603790283203125, 0.058653831481933594, 0.06126976013183594, 0.06388568878173828, 0.06650161743164062, 0.06911754608154297, 0.07173347473144531, 0.07434940338134766, 0.07696533203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4.0, 9.0, 7.0, 11.0, 21.0, 23.0, 34.0, 43.0, 67.0, 81.0, 147.0, 258.0, 427.0, 714.0, 1350.0, 2870.0, 7210.0, 20681.0, 66444.0, 253292.0, 475809.0, 152720.0, 42490.0, 13865.0, 5160.0, 2214.0, 1058.0, 508.0, 343.0, 213.0, 155.0, 89.0, 73.0, 39.0, 38.0, 19.0, 15.0, 6.0, 5.0, 7.0, 5.0, 5.0, 8.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-0.07489013671875, -0.0727696418762207, -0.0706491470336914, -0.06852865219116211, -0.06640815734863281, -0.06428766250610352, -0.06216716766357422, -0.06004667282104492, -0.057926177978515625, -0.05580568313598633, -0.05368518829345703, -0.051564693450927734, -0.04944419860839844, -0.04732370376586914, -0.045203208923339844, -0.04308271408081055, -0.04096221923828125, -0.03884172439575195, -0.036721229553222656, -0.03460073471069336, -0.03248023986816406, -0.030359745025634766, -0.02823925018310547, -0.026118755340576172, -0.023998260498046875, -0.021877765655517578, -0.01975727081298828, -0.017636775970458984, -0.015516281127929688, -0.01339578628540039, -0.011275291442871094, -0.009154796600341797, -0.0070343017578125, -0.004913806915283203, -0.0027933120727539062, -0.0006728172302246094, 0.0014476776123046875, 0.0035681724548339844, 0.005688667297363281, 0.007809162139892578, 0.009929656982421875, 0.012050151824951172, 0.014170646667480469, 0.016291141510009766, 0.018411636352539062, 0.02053213119506836, 0.022652626037597656, 0.024773120880126953, 0.02689361572265625, 0.029014110565185547, 0.031134605407714844, 0.03325510025024414, 0.03537559509277344, 0.037496089935302734, 0.03961658477783203, 0.04173707962036133, 0.043857574462890625, 0.04597806930541992, 0.04809856414794922, 0.050219058990478516, 0.05233955383300781, 0.05446004867553711, 0.056580543518066406, 0.0587010383605957, 0.060821533203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 4.0, 9.0, 4.0, 9.0, 5.0, 16.0, 20.0, 16.0, 29.0, 36.0, 34.0, 39.0, 45.0, 48.0, 52.0, 60.0, 55.0, 59.0, 61.0, 55.0, 53.0, 41.0, 48.0, 31.0, 37.0, 32.0, 25.0, 14.0, 11.0, 10.0, 12.0, 8.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06732177734375, -0.06452083587646484, -0.06171989440917969, -0.05891895294189453, -0.056118011474609375, -0.05331707000732422, -0.05051612854003906, -0.047715187072753906, -0.04491424560546875, -0.042113304138183594, -0.03931236267089844, -0.03651142120361328, -0.033710479736328125, -0.03090953826904297, -0.028108596801757812, -0.025307655334472656, -0.0225067138671875, -0.019705772399902344, -0.016904830932617188, -0.014103889465332031, -0.011302947998046875, -0.008502006530761719, -0.0057010650634765625, -0.0029001235961914062, -9.918212890625e-05, 0.0027017593383789062, 0.0055027008056640625, 0.008303642272949219, 0.011104583740234375, 0.013905525207519531, 0.016706466674804688, 0.019507408142089844, 0.022308349609375, 0.025109291076660156, 0.027910232543945312, 0.03071117401123047, 0.033512115478515625, 0.03631305694580078, 0.03911399841308594, 0.041914939880371094, 0.04471588134765625, 0.047516822814941406, 0.05031776428222656, 0.05311870574951172, 0.055919647216796875, 0.05872058868408203, 0.06152153015136719, 0.06432247161865234, 0.0671234130859375, 0.06992435455322266, 0.07272529602050781, 0.07552623748779297, 0.07832717895507812, 0.08112812042236328, 0.08392906188964844, 0.0867300033569336, 0.08953094482421875, 0.0923318862915039, 0.09513282775878906, 0.09793376922607422, 0.10073471069335938, 0.10353565216064453, 0.10633659362792969, 0.10913753509521484, 0.1119384765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 4.0, 5.0, 28.0, 25.0, 44.0, 73.0, 110.0, 253.0, 379.0, 792.0, 1444.0, 2918.0, 6187.0, 15997.0, 52147.0, 199717.0, 507631.0, 184960.0, 48659.0, 15191.0, 5973.0, 2944.0, 1445.0, 723.0, 379.0, 204.0, 108.0, 80.0, 44.0, 27.0, 17.0, 10.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0255889892578125, -0.024775981903076172, -0.023962974548339844, -0.023149967193603516, -0.022336959838867188, -0.02152395248413086, -0.02071094512939453, -0.019897937774658203, -0.019084930419921875, -0.018271923065185547, -0.01745891571044922, -0.01664590835571289, -0.015832901000976562, -0.015019893646240234, -0.014206886291503906, -0.013393878936767578, -0.01258087158203125, -0.011767864227294922, -0.010954856872558594, -0.010141849517822266, -0.009328842163085938, -0.00851583480834961, -0.007702827453613281, -0.006889820098876953, -0.006076812744140625, -0.005263805389404297, -0.004450798034667969, -0.0036377906799316406, -0.0028247833251953125, -0.0020117759704589844, -0.0011987686157226562, -0.0003857612609863281, 0.00042724609375, 0.0012402534484863281, 0.0020532608032226562, 0.0028662681579589844, 0.0036792755126953125, 0.004492282867431641, 0.005305290222167969, 0.006118297576904297, 0.006931304931640625, 0.007744312286376953, 0.008557319641113281, 0.00937032699584961, 0.010183334350585938, 0.010996341705322266, 0.011809349060058594, 0.012622356414794922, 0.01343536376953125, 0.014248371124267578, 0.015061378479003906, 0.015874385833740234, 0.016687393188476562, 0.01750040054321289, 0.01831340789794922, 0.019126415252685547, 0.019939422607421875, 0.020752429962158203, 0.02156543731689453, 0.02237844467163086, 0.023191452026367188, 0.024004459381103516, 0.024817466735839844, 0.025630474090576172, 0.0264434814453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 4.0, 1.0, 6.0, 5.0, 9.0, 5.0, 18.0, 15.0, 18.0, 27.0, 45.0, 41.0, 56.0, 64.0, 92.0, 81.0, 89.0, 80.0, 75.0, 60.0, 30.0, 38.0, 28.0, 25.0, 13.0, 14.0, 10.0, 11.0, 7.0, 7.0, 4.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.894371032714844e-06, -9.564682841300964e-06, -9.234994649887085e-06, -8.905306458473206e-06, -8.575618267059326e-06, -8.245930075645447e-06, -7.916241884231567e-06, -7.586553692817688e-06, -7.256865501403809e-06, -6.927177309989929e-06, -6.59748911857605e-06, -6.26780092716217e-06, -5.938112735748291e-06, -5.608424544334412e-06, -5.278736352920532e-06, -4.949048161506653e-06, -4.6193599700927734e-06, -4.289671778678894e-06, -3.959983587265015e-06, -3.6302953958511353e-06, -3.300607204437256e-06, -2.9709190130233765e-06, -2.641230821609497e-06, -2.3115426301956177e-06, -1.9818544387817383e-06, -1.6521662473678589e-06, -1.3224780559539795e-06, -9.927898645401e-07, -6.631016731262207e-07, -3.334134817123413e-07, -3.725290298461914e-09, 3.259629011154175e-07, 6.556510925292969e-07, 9.853392839431763e-07, 1.3150274753570557e-06, 1.644715666770935e-06, 1.9744038581848145e-06, 2.304092049598694e-06, 2.6337802410125732e-06, 2.9634684324264526e-06, 3.293156623840332e-06, 3.6228448152542114e-06, 3.952533006668091e-06, 4.28222119808197e-06, 4.61190938949585e-06, 4.941597580909729e-06, 5.271285772323608e-06, 5.600973963737488e-06, 5.930662155151367e-06, 6.260350346565247e-06, 6.590038537979126e-06, 6.919726729393005e-06, 7.249414920806885e-06, 7.579103112220764e-06, 7.908791303634644e-06, 8.238479495048523e-06, 8.568167686462402e-06, 8.897855877876282e-06, 9.227544069290161e-06, 9.55723226070404e-06, 9.88692045211792e-06, 1.02166086435318e-05, 1.0546296834945679e-05, 1.0875985026359558e-05, 1.1205673217773438e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 10.0, 13.0, 18.0, 22.0, 43.0, 46.0, 64.0, 92.0, 130.0, 180.0, 285.0, 378.0, 597.0, 856.0, 1406.0, 2342.0, 4078.0, 8109.0, 18207.0, 53932.0, 215682.0, 493092.0, 171848.0, 44248.0, 15822.0, 7183.0, 3758.0, 2232.0, 1242.0, 852.0, 537.0, 355.0, 264.0, 173.0, 146.0, 91.0, 52.0, 48.0, 30.0, 20.0, 23.0, 10.0, 11.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02691650390625, -0.0260317325592041, -0.025146961212158203, -0.024262189865112305, -0.023377418518066406, -0.022492647171020508, -0.02160787582397461, -0.02072310447692871, -0.019838333129882812, -0.018953561782836914, -0.018068790435791016, -0.017184019088745117, -0.01629924774169922, -0.01541447639465332, -0.014529705047607422, -0.013644933700561523, -0.012760162353515625, -0.011875391006469727, -0.010990619659423828, -0.01010584831237793, -0.009221076965332031, -0.008336305618286133, -0.007451534271240234, -0.006566762924194336, -0.0056819915771484375, -0.004797220230102539, -0.003912448883056641, -0.003027677536010742, -0.0021429061889648438, -0.0012581348419189453, -0.0003733634948730469, 0.0005114078521728516, 0.00139617919921875, 0.0022809505462646484, 0.003165721893310547, 0.004050493240356445, 0.004935264587402344, 0.005820035934448242, 0.006704807281494141, 0.007589578628540039, 0.008474349975585938, 0.009359121322631836, 0.010243892669677734, 0.011128664016723633, 0.012013435363769531, 0.01289820671081543, 0.013782978057861328, 0.014667749404907227, 0.015552520751953125, 0.016437292098999023, 0.017322063446044922, 0.01820683479309082, 0.01909160614013672, 0.019976377487182617, 0.020861148834228516, 0.021745920181274414, 0.022630691528320312, 0.02351546287536621, 0.02440023422241211, 0.025285005569458008, 0.026169776916503906, 0.027054548263549805, 0.027939319610595703, 0.0288240909576416, 0.0297088623046875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 6.0, 7.0, 6.0, 12.0, 9.0, 17.0, 23.0, 30.0, 43.0, 31.0, 49.0, 39.0, 50.0, 67.0, 75.0, 67.0, 77.0, 48.0, 56.0, 55.0, 42.0, 40.0, 28.0, 18.0, 20.0, 19.0, 11.0, 8.0, 3.0, 6.0, 5.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0175628662109375, -0.017005443572998047, -0.016448020935058594, -0.01589059829711914, -0.015333175659179688, -0.014775753021240234, -0.014218330383300781, -0.013660907745361328, -0.013103485107421875, -0.012546062469482422, -0.011988639831542969, -0.011431217193603516, -0.010873794555664062, -0.01031637191772461, -0.009758949279785156, -0.009201526641845703, -0.00864410400390625, -0.008086681365966797, -0.007529258728027344, -0.006971836090087891, -0.0064144134521484375, -0.005856990814208984, -0.005299568176269531, -0.004742145538330078, -0.004184722900390625, -0.003627300262451172, -0.0030698776245117188, -0.0025124549865722656, -0.0019550323486328125, -0.0013976097106933594, -0.0008401870727539062, -0.0002827644348144531, 0.000274658203125, 0.0008320808410644531, 0.0013895034790039062, 0.0019469261169433594, 0.0025043487548828125, 0.0030617713928222656, 0.0036191940307617188, 0.004176616668701172, 0.004734039306640625, 0.005291461944580078, 0.005848884582519531, 0.006406307220458984, 0.0069637298583984375, 0.007521152496337891, 0.008078575134277344, 0.008635997772216797, 0.00919342041015625, 0.009750843048095703, 0.010308265686035156, 0.01086568832397461, 0.011423110961914062, 0.011980533599853516, 0.012537956237792969, 0.013095378875732422, 0.013652801513671875, 0.014210224151611328, 0.014767646789550781, 0.015325069427490234, 0.015882492065429688, 0.01643991470336914, 0.016997337341308594, 0.017554759979248047, 0.0181121826171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 34.0, 77.0, 154.0, 273.0, 247.0, 118.0, 52.0, 26.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7593518495559692, -0.7416942715644836, -0.724036693572998, -0.7063791751861572, -0.6887215971946716, -0.671064019203186, -0.6534065008163452, -0.6357489228248596, -0.618091344833374, -0.6004337668418884, -0.5827761888504028, -0.565118670463562, -0.5474610924720764, -0.5298035144805908, -0.51214599609375, -0.4944884181022644, -0.4768308401107788, -0.4591732621192932, -0.44151571393013, -0.4238581657409668, -0.4062005877494812, -0.3885430097579956, -0.3708854615688324, -0.3532279133796692, -0.3355703353881836, -0.317912757396698, -0.3002552092075348, -0.2825976610183716, -0.264940083026886, -0.24728251993656158, -0.22962495684623718, -0.21196739375591278, -0.19430989027023315, -0.17665232717990875, -0.15899476408958435, -0.14133720099925995, -0.12367963790893555, -0.10602207481861115, -0.08836451172828674, -0.07070694863796234, -0.05304938554763794, -0.03539182245731354, -0.017734259366989136, -7.669627666473389e-05, 0.017580866813659668, 0.03523842990398407, 0.05289599299430847, 0.07055355608463287, 0.08821111917495728, 0.10586868226528168, 0.12352624535560608, 0.14118380844593048, 0.15884137153625488, 0.17649893462657928, 0.1941564977169037, 0.2118140608072281, 0.2294716238975525, 0.2471291869878769, 0.2647867500782013, 0.2824442982673645, 0.3001018762588501, 0.3177594542503357, 0.3354170024394989, 0.3530745506286621, 0.3707321286201477]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 8.0, 10.0, 6.0, 4.0, 5.0, 9.0, 11.0, 16.0, 14.0, 24.0, 20.0, 22.0, 19.0, 18.0, 38.0, 29.0, 29.0, 25.0, 33.0, 29.0, 39.0, 35.0, 27.0, 42.0, 37.0, 36.0, 35.0, 33.0, 36.0, 24.0, 27.0, 28.0, 28.0, 30.0, 18.0, 19.0, 16.0, 14.0, 13.0, 16.0, 10.0, 10.0, 8.0, 9.0, 9.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0], "bins": [-0.1395571231842041, -0.13523133099079132, -0.13090552389621735, -0.12657973170280457, -0.12225393950939178, -0.11792813986539841, -0.11360234022140503, -0.10927654802799225, -0.10495074838399887, -0.1006249487400055, -0.09629915654659271, -0.09197335690259933, -0.08764755725860596, -0.08332176506519318, -0.0789959654211998, -0.07467016577720642, -0.07034437358379364, -0.06601857393980026, -0.06169278174638748, -0.057366982102394104, -0.053041186183691025, -0.048715390264987946, -0.04438959062099457, -0.04006379470229149, -0.03573799878358841, -0.03141220286488533, -0.027086405083537102, -0.022760607302188873, -0.018434811383485794, -0.014109015464782715, -0.009783217683434486, -0.005457419902086258, -0.0011316239833831787, 0.003194172866642475, 0.007519969716668129, 0.011845766566693783, 0.016171563416719437, 0.020497359335422516, 0.024823157116770744, 0.029148954898118973, 0.03347475081682205, 0.03780054673552513, 0.04212634265422821, 0.04645214229822159, 0.05077793821692467, 0.05510373413562775, 0.059429533779621124, 0.0637553334236145, 0.06808112561702728, 0.07240692526102066, 0.07673271745443344, 0.08105851709842682, 0.0853843092918396, 0.08971010893583298, 0.09403590857982635, 0.09836170077323914, 0.10268750041723251, 0.10701330006122589, 0.11133909225463867, 0.11566489189863205, 0.11999069154262543, 0.12431648373603821, 0.128642275929451, 0.13296808302402496, 0.13729387521743774]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 7.0, 7.0, 7.0, 13.0, 19.0, 22.0, 28.0, 62.0, 65.0, 84.0, 141.0, 252.0, 351.0, 586.0, 1156.0, 2346.0, 5459.0, 12252.0, 37312.0, 176533.0, 1261719.0, 2152111.0, 437212.0, 73465.0, 19568.0, 7033.0, 3179.0, 1478.0, 667.0, 368.0, 252.0, 138.0, 90.0, 91.0, 43.0, 41.0, 24.0, 24.0, 14.0, 14.0, 5.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.058837890625, -0.057066917419433594, -0.05529594421386719, -0.05352497100830078, -0.051753997802734375, -0.04998302459716797, -0.04821205139160156, -0.046441078186035156, -0.04467010498046875, -0.042899131774902344, -0.04112815856933594, -0.03935718536376953, -0.037586212158203125, -0.03581523895263672, -0.03404426574707031, -0.032273292541503906, -0.0305023193359375, -0.028731346130371094, -0.026960372924804688, -0.02518939971923828, -0.023418426513671875, -0.02164745330810547, -0.019876480102539062, -0.018105506896972656, -0.01633453369140625, -0.014563560485839844, -0.012792587280273438, -0.011021614074707031, -0.009250640869140625, -0.007479667663574219, -0.0057086944580078125, -0.003937721252441406, -0.002166748046875, -0.00039577484130859375, 0.0013751983642578125, 0.0031461715698242188, 0.004917144775390625, 0.006688117980957031, 0.008459091186523438, 0.010230064392089844, 0.01200103759765625, 0.013772010803222656, 0.015542984008789062, 0.01731395721435547, 0.019084930419921875, 0.02085590362548828, 0.022626876831054688, 0.024397850036621094, 0.0261688232421875, 0.027939796447753906, 0.029710769653320312, 0.03148174285888672, 0.033252716064453125, 0.03502368927001953, 0.03679466247558594, 0.038565635681152344, 0.04033660888671875, 0.042107582092285156, 0.04387855529785156, 0.04564952850341797, 0.047420501708984375, 0.04919147491455078, 0.05096244812011719, 0.052733421325683594, 0.05450439453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 19.0, 41.0, 58.0, 66.0, 113.0, 122.0, 150.0, 130.0, 100.0, 88.0, 44.0, 35.0, 18.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09039306640625, -0.0877676010131836, -0.08514213562011719, -0.08251667022705078, -0.07989120483398438, -0.07726573944091797, -0.07464027404785156, -0.07201480865478516, -0.06938934326171875, -0.06676387786865234, -0.06413841247558594, -0.06151294708251953, -0.058887481689453125, -0.05626201629638672, -0.05363655090332031, -0.051011085510253906, -0.0483856201171875, -0.045760154724121094, -0.04313468933105469, -0.04050922393798828, -0.037883758544921875, -0.03525829315185547, -0.03263282775878906, -0.030007362365722656, -0.02738189697265625, -0.024756431579589844, -0.022130966186523438, -0.01950550079345703, -0.016880035400390625, -0.014254570007324219, -0.011629104614257812, -0.009003639221191406, -0.006378173828125, -0.0037527084350585938, -0.0011272430419921875, 0.0014982223510742188, 0.004123687744140625, 0.006749153137207031, 0.009374618530273438, 0.012000083923339844, 0.01462554931640625, 0.017251014709472656, 0.019876480102539062, 0.02250194549560547, 0.025127410888671875, 0.02775287628173828, 0.030378341674804688, 0.033003807067871094, 0.0356292724609375, 0.038254737854003906, 0.04088020324707031, 0.04350566864013672, 0.046131134033203125, 0.04875659942626953, 0.05138206481933594, 0.054007530212402344, 0.05663299560546875, 0.059258460998535156, 0.06188392639160156, 0.06450939178466797, 0.06713485717773438, 0.06976032257080078, 0.07238578796386719, 0.0750112533569336, 0.07763671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 4.0, 8.0, 12.0, 15.0, 29.0, 45.0, 66.0, 107.0, 150.0, 245.0, 454.0, 950.0, 1877.0, 4846.0, 13819.0, 46873.0, 187578.0, 1104870.0, 2285974.0, 418308.0, 90202.0, 24477.0, 7752.0, 2879.0, 1226.0, 642.0, 341.0, 204.0, 125.0, 64.0, 54.0, 27.0, 14.0, 11.0, 12.0, 6.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0418701171875, -0.04021167755126953, -0.03855323791503906, -0.036894798278808594, -0.035236358642578125, -0.033577919006347656, -0.03191947937011719, -0.03026103973388672, -0.02860260009765625, -0.02694416046142578, -0.025285720825195312, -0.023627281188964844, -0.021968841552734375, -0.020310401916503906, -0.018651962280273438, -0.01699352264404297, -0.0153350830078125, -0.013676643371582031, -0.012018203735351562, -0.010359764099121094, -0.008701324462890625, -0.007042884826660156, -0.0053844451904296875, -0.0037260055541992188, -0.00206756591796875, -0.00040912628173828125, 0.0012493133544921875, 0.0029077529907226562, 0.004566192626953125, 0.006224632263183594, 0.007883071899414062, 0.009541511535644531, 0.011199951171875, 0.012858390808105469, 0.014516830444335938, 0.016175270080566406, 0.017833709716796875, 0.019492149353027344, 0.021150588989257812, 0.02280902862548828, 0.02446746826171875, 0.02612590789794922, 0.027784347534179688, 0.029442787170410156, 0.031101226806640625, 0.032759666442871094, 0.03441810607910156, 0.03607654571533203, 0.0377349853515625, 0.03939342498779297, 0.04105186462402344, 0.042710304260253906, 0.044368743896484375, 0.046027183532714844, 0.04768562316894531, 0.04934406280517578, 0.05100250244140625, 0.05266094207763672, 0.05431938171386719, 0.055977821350097656, 0.057636260986328125, 0.059294700622558594, 0.06095314025878906, 0.06261157989501953, 0.06427001953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 12.0, 15.0, 23.0, 22.0, 30.0, 31.0, 64.0, 70.0, 96.0, 134.0, 159.0, 293.0, 360.0, 526.0, 552.0, 491.0, 369.0, 226.0, 171.0, 93.0, 85.0, 79.0, 46.0, 42.0, 23.0, 13.0, 11.0, 6.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06256103515625, -0.060884952545166016, -0.05920886993408203, -0.05753278732299805, -0.05585670471191406, -0.05418062210083008, -0.052504539489746094, -0.05082845687866211, -0.049152374267578125, -0.04747629165649414, -0.045800209045410156, -0.04412412643432617, -0.04244804382324219, -0.0407719612121582, -0.03909587860107422, -0.037419795989990234, -0.03574371337890625, -0.034067630767822266, -0.03239154815673828, -0.030715465545654297, -0.029039382934570312, -0.027363300323486328, -0.025687217712402344, -0.02401113510131836, -0.022335052490234375, -0.02065896987915039, -0.018982887268066406, -0.017306804656982422, -0.015630722045898438, -0.013954639434814453, -0.012278556823730469, -0.010602474212646484, -0.0089263916015625, -0.007250308990478516, -0.005574226379394531, -0.003898143768310547, -0.0022220611572265625, -0.0005459785461425781, 0.0011301040649414062, 0.0028061866760253906, 0.004482269287109375, 0.006158351898193359, 0.007834434509277344, 0.009510517120361328, 0.011186599731445312, 0.012862682342529297, 0.014538764953613281, 0.016214847564697266, 0.01789093017578125, 0.019567012786865234, 0.02124309539794922, 0.022919178009033203, 0.024595260620117188, 0.026271343231201172, 0.027947425842285156, 0.02962350845336914, 0.031299591064453125, 0.03297567367553711, 0.034651756286621094, 0.03632783889770508, 0.03800392150878906, 0.03968000411987305, 0.04135608673095703, 0.043032169342041016, 0.044708251953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 22.0, 82.0, 146.0, 297.0, 230.0, 132.0, 59.0, 17.0, 9.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0928850173950195, -1.0705254077911377, -1.0481659173965454, -1.0258063077926636, -1.0034466981887817, -0.9810871481895447, -0.9587275981903076, -0.9363679885864258, -0.914008378982544, -0.8916488289833069, -0.869289219379425, -0.846929669380188, -0.8245700597763062, -0.8022105097770691, -0.779850959777832, -0.7574913501739502, -0.7351318001747131, -0.7127722501754761, -0.6904126405715942, -0.6680530905723572, -0.6456934809684753, -0.6233339309692383, -0.6009743213653564, -0.5786147713661194, -0.5562552213668823, -0.5338956713676453, -0.5115360617637634, -0.48917651176452637, -0.46681690216064453, -0.44445735216140747, -0.422097772359848, -0.3997381925582886, -0.3773786425590515, -0.35501906275749207, -0.3326594829559326, -0.31029993295669556, -0.2879403233528137, -0.26558077335357666, -0.2432211935520172, -0.22086161375045776, -0.19850203394889832, -0.17614245414733887, -0.15378287434577942, -0.13142330944538116, -0.10906372964382172, -0.08670414984226227, -0.06434458494186401, -0.041985005140304565, -0.019625425338745117, 0.0027341507375240326, 0.025093726813793182, 0.047453299164772034, 0.06981287896633148, 0.09217245876789093, 0.11453202366828918, 0.13689160346984863, 0.15925118327140808, 0.18161076307296753, 0.20397034287452698, 0.22632990777492523, 0.24868948757648468, 0.2710490822792053, 0.2934086322784424, 0.31576821208000183, 0.3381277918815613]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 1.0, 1.0, 8.0, 7.0, 10.0, 12.0, 13.0, 23.0, 23.0, 29.0, 25.0, 27.0, 28.0, 40.0, 44.0, 46.0, 39.0, 37.0, 40.0, 44.0, 40.0, 55.0, 31.0, 49.0, 39.0, 44.0, 43.0, 28.0, 23.0, 30.0, 25.0, 22.0, 8.0, 8.0, 18.0, 12.0, 7.0, 4.0, 3.0, 5.0, 8.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.17290765047073364, -0.1673312932252884, -0.16175492107868195, -0.1561785638332367, -0.15060219168663025, -0.145025834441185, -0.13944947719573975, -0.1338731050491333, -0.12829673290252686, -0.12272036820650101, -0.11714400351047516, -0.11156764626502991, -0.10599127411842346, -0.10041491687297821, -0.09483855217695236, -0.08926218748092651, -0.08368583023548126, -0.07810946553945541, -0.07253310084342957, -0.06695674359798431, -0.06138037517666817, -0.05580401048064232, -0.05022764950990677, -0.04465128481388092, -0.03907492011785507, -0.033498555421829224, -0.027922192588448524, -0.022345829755067825, -0.016769465059041977, -0.011193100363016129, -0.005616739392280579, -4.0374696254730225e-05, 0.005535989999771118, 0.011112353764474392, 0.016688717529177666, 0.022265080362558365, 0.027841445058584213, 0.03341780975461006, 0.03899417072534561, 0.04457053542137146, 0.05014690011739731, 0.05572326481342316, 0.061299629509449005, 0.06687599420547485, 0.0724523514509201, 0.07802872359752655, 0.0836050808429718, 0.08918144553899765, 0.0947578102350235, 0.10033417493104935, 0.1059105396270752, 0.11148689687252045, 0.11706326901912689, 0.12263962626457214, 0.1282159984111786, 0.13379235565662384, 0.1393687129020691, 0.14494507014751434, 0.1505214422941208, 0.15609779953956604, 0.16167417168617249, 0.16725052893161774, 0.172826886177063, 0.17840325832366943, 0.18397963047027588]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 11.0, 13.0, 15.0, 17.0, 25.0, 36.0, 46.0, 79.0, 105.0, 118.0, 252.0, 397.0, 724.0, 1309.0, 3072.0, 8928.0, 30639.0, 122355.0, 451251.0, 323098.0, 75481.0, 19787.0, 5853.0, 2283.0, 1049.0, 554.0, 365.0, 231.0, 143.0, 102.0, 70.0, 33.0, 25.0, 17.0, 19.0, 7.0, 8.0, 12.0, 6.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09149169921875, -0.08870506286621094, -0.08591842651367188, -0.08313179016113281, -0.08034515380859375, -0.07755851745605469, -0.07477188110351562, -0.07198524475097656, -0.0691986083984375, -0.06641197204589844, -0.06362533569335938, -0.06083869934082031, -0.05805206298828125, -0.05526542663574219, -0.052478790283203125, -0.04969215393066406, -0.046905517578125, -0.04411888122558594, -0.041332244873046875, -0.03854560852050781, -0.03575897216796875, -0.03297233581542969, -0.030185699462890625, -0.027399063110351562, -0.0246124267578125, -0.021825790405273438, -0.019039154052734375, -0.016252517700195312, -0.01346588134765625, -0.010679244995117188, -0.007892608642578125, -0.0051059722900390625, -0.0023193359375, 0.0004673004150390625, 0.003253936767578125, 0.0060405731201171875, 0.00882720947265625, 0.011613845825195312, 0.014400482177734375, 0.017187118530273438, 0.0199737548828125, 0.022760391235351562, 0.025547027587890625, 0.028333663940429688, 0.03112030029296875, 0.03390693664550781, 0.036693572998046875, 0.03948020935058594, 0.042266845703125, 0.04505348205566406, 0.047840118408203125, 0.05062675476074219, 0.05341339111328125, 0.05620002746582031, 0.058986663818359375, 0.06177330017089844, 0.0645599365234375, 0.06734657287597656, 0.07013320922851562, 0.07291984558105469, 0.07570648193359375, 0.07849311828613281, 0.08127975463867188, 0.08406639099121094, 0.08685302734375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 18.0, 37.0, 59.0, 73.0, 101.0, 119.0, 126.0, 128.0, 112.0, 105.0, 55.0, 29.0, 18.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0894775390625, -0.08688831329345703, -0.08429908752441406, -0.0817098617553711, -0.07912063598632812, -0.07653141021728516, -0.07394218444824219, -0.07135295867919922, -0.06876373291015625, -0.06617450714111328, -0.06358528137207031, -0.060996055603027344, -0.058406829833984375, -0.055817604064941406, -0.05322837829589844, -0.05063915252685547, -0.0480499267578125, -0.04546070098876953, -0.04287147521972656, -0.040282249450683594, -0.037693023681640625, -0.035103797912597656, -0.03251457214355469, -0.02992534637451172, -0.02733612060546875, -0.02474689483642578, -0.022157669067382812, -0.019568443298339844, -0.016979217529296875, -0.014389991760253906, -0.011800765991210938, -0.009211540222167969, -0.006622314453125, -0.004033088684082031, -0.0014438629150390625, 0.0011453628540039062, 0.003734588623046875, 0.006323814392089844, 0.008913040161132812, 0.011502265930175781, 0.01409149169921875, 0.01668071746826172, 0.019269943237304688, 0.021859169006347656, 0.024448394775390625, 0.027037620544433594, 0.029626846313476562, 0.03221607208251953, 0.0348052978515625, 0.03739452362060547, 0.03998374938964844, 0.042572975158691406, 0.045162200927734375, 0.047751426696777344, 0.05034065246582031, 0.05292987823486328, 0.05551910400390625, 0.05810832977294922, 0.06069755554199219, 0.06328678131103516, 0.06587600708007812, 0.0684652328491211, 0.07105445861816406, 0.07364368438720703, 0.07623291015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 17.0, 19.0, 26.0, 33.0, 48.0, 72.0, 130.0, 174.0, 341.0, 615.0, 1425.0, 3865.0, 12553.0, 41900.0, 151336.0, 466166.0, 268477.0, 70342.0, 20693.0, 6214.0, 2127.0, 833.0, 448.0, 218.0, 141.0, 102.0, 75.0, 47.0, 31.0, 14.0, 22.0, 11.0, 11.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.08819580078125, -0.08585691452026367, -0.08351802825927734, -0.08117914199829102, -0.07884025573730469, -0.07650136947631836, -0.07416248321533203, -0.0718235969543457, -0.06948471069335938, -0.06714582443237305, -0.06480693817138672, -0.06246805191040039, -0.06012916564941406, -0.057790279388427734, -0.055451393127441406, -0.05311250686645508, -0.05077362060546875, -0.04843473434448242, -0.046095848083496094, -0.043756961822509766, -0.04141807556152344, -0.03907918930053711, -0.03674030303955078, -0.03440141677856445, -0.032062530517578125, -0.029723644256591797, -0.02738475799560547, -0.02504587173461914, -0.022706985473632812, -0.020368099212646484, -0.018029212951660156, -0.015690326690673828, -0.0133514404296875, -0.011012554168701172, -0.008673667907714844, -0.006334781646728516, -0.0039958953857421875, -0.0016570091247558594, 0.0006818771362304688, 0.003020763397216797, 0.005359649658203125, 0.007698535919189453, 0.010037422180175781, 0.01237630844116211, 0.014715194702148438, 0.017054080963134766, 0.019392967224121094, 0.021731853485107422, 0.02407073974609375, 0.026409626007080078, 0.028748512268066406, 0.031087398529052734, 0.03342628479003906, 0.03576517105102539, 0.03810405731201172, 0.04044294357299805, 0.042781829833984375, 0.0451207160949707, 0.04745960235595703, 0.04979848861694336, 0.05213737487792969, 0.054476261138916016, 0.056815147399902344, 0.05915403366088867, 0.061492919921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 8.0, 5.0, 11.0, 8.0, 13.0, 13.0, 10.0, 20.0, 18.0, 30.0, 30.0, 42.0, 41.0, 28.0, 56.0, 58.0, 48.0, 52.0, 59.0, 46.0, 43.0, 39.0, 50.0, 35.0, 40.0, 24.0, 18.0, 28.0, 33.0, 16.0, 15.0, 8.0, 3.0, 12.0, 9.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07757568359375, -0.0751953125, -0.07281494140625, -0.0704345703125, -0.06805419921875, -0.065673828125, -0.06329345703125, -0.0609130859375, -0.05853271484375, -0.05615234375, -0.05377197265625, -0.0513916015625, -0.04901123046875, -0.046630859375, -0.04425048828125, -0.0418701171875, -0.03948974609375, -0.037109375, -0.03472900390625, -0.0323486328125, -0.02996826171875, -0.027587890625, -0.02520751953125, -0.0228271484375, -0.02044677734375, -0.01806640625, -0.01568603515625, -0.0133056640625, -0.01092529296875, -0.008544921875, -0.00616455078125, -0.0037841796875, -0.00140380859375, 0.0009765625, 0.00335693359375, 0.0057373046875, 0.00811767578125, 0.010498046875, 0.01287841796875, 0.0152587890625, 0.01763916015625, 0.02001953125, 0.02239990234375, 0.0247802734375, 0.02716064453125, 0.029541015625, 0.03192138671875, 0.0343017578125, 0.03668212890625, 0.0390625, 0.04144287109375, 0.0438232421875, 0.04620361328125, 0.048583984375, 0.05096435546875, 0.0533447265625, 0.05572509765625, 0.05810546875, 0.06048583984375, 0.0628662109375, 0.06524658203125, 0.067626953125, 0.07000732421875, 0.0723876953125, 0.07476806640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 8.0, 10.0, 33.0, 25.0, 40.0, 57.0, 94.0, 138.0, 205.0, 319.0, 512.0, 828.0, 1438.0, 2635.0, 5046.0, 10754.0, 23581.0, 54375.0, 130019.0, 294140.0, 294031.0, 129873.0, 54511.0, 23750.0, 10564.0, 5152.0, 2620.0, 1387.0, 881.0, 511.0, 367.0, 210.0, 126.0, 104.0, 76.0, 48.0, 34.0, 14.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01654052734375, -0.016023635864257812, -0.015506744384765625, -0.014989852905273438, -0.01447296142578125, -0.013956069946289062, -0.013439178466796875, -0.012922286987304688, -0.0124053955078125, -0.011888504028320312, -0.011371612548828125, -0.010854721069335938, -0.01033782958984375, -0.009820938110351562, -0.009304046630859375, -0.008787155151367188, -0.008270263671875, -0.0077533721923828125, -0.007236480712890625, -0.0067195892333984375, -0.00620269775390625, -0.0056858062744140625, -0.005168914794921875, -0.0046520233154296875, -0.0041351318359375, -0.0036182403564453125, -0.003101348876953125, -0.0025844573974609375, -0.00206756591796875, -0.0015506744384765625, -0.001033782958984375, -0.0005168914794921875, 0.0, 0.0005168914794921875, 0.001033782958984375, 0.0015506744384765625, 0.00206756591796875, 0.0025844573974609375, 0.003101348876953125, 0.0036182403564453125, 0.0041351318359375, 0.0046520233154296875, 0.005168914794921875, 0.0056858062744140625, 0.00620269775390625, 0.0067195892333984375, 0.007236480712890625, 0.0077533721923828125, 0.008270263671875, 0.008787155151367188, 0.009304046630859375, 0.009820938110351562, 0.01033782958984375, 0.010854721069335938, 0.011371612548828125, 0.011888504028320312, 0.0124053955078125, 0.012922286987304688, 0.013439178466796875, 0.013956069946289062, 0.01447296142578125, 0.014989852905273438, 0.015506744384765625, 0.016023635864257812, 0.01654052734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 3.0, 15.0, 12.0, 36.0, 36.0, 48.0, 83.0, 96.0, 104.0, 119.0, 76.0, 115.0, 82.0, 46.0, 31.0, 28.0, 16.0, 20.0, 6.0, 8.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.569789886474609e-06, -7.164664566516876e-06, -6.759539246559143e-06, -6.35441392660141e-06, -5.949288606643677e-06, -5.544163286685944e-06, -5.1390379667282104e-06, -4.733912646770477e-06, -4.328787326812744e-06, -3.923662006855011e-06, -3.518536686897278e-06, -3.1134113669395447e-06, -2.7082860469818115e-06, -2.3031607270240784e-06, -1.8980354070663452e-06, -1.492910087108612e-06, -1.087784767150879e-06, -6.826594471931458e-07, -2.775341272354126e-07, 1.2759119272232056e-07, 5.327165126800537e-07, 9.378418326377869e-07, 1.34296715259552e-06, 1.7480924725532532e-06, 2.1532177925109863e-06, 2.5583431124687195e-06, 2.9634684324264526e-06, 3.368593752384186e-06, 3.773719072341919e-06, 4.178844392299652e-06, 4.583969712257385e-06, 4.989095032215118e-06, 5.3942203521728516e-06, 5.799345672130585e-06, 6.204470992088318e-06, 6.609596312046051e-06, 7.014721632003784e-06, 7.419846951961517e-06, 7.82497227191925e-06, 8.230097591876984e-06, 8.635222911834717e-06, 9.04034823179245e-06, 9.445473551750183e-06, 9.850598871707916e-06, 1.025572419166565e-05, 1.0660849511623383e-05, 1.1065974831581116e-05, 1.1471100151538849e-05, 1.1876225471496582e-05, 1.2281350791454315e-05, 1.2686476111412048e-05, 1.3091601431369781e-05, 1.3496726751327515e-05, 1.3901852071285248e-05, 1.4306977391242981e-05, 1.4712102711200714e-05, 1.5117228031158447e-05, 1.552235335111618e-05, 1.5927478671073914e-05, 1.6332603991031647e-05, 1.673772931098938e-05, 1.7142854630947113e-05, 1.7547979950904846e-05, 1.795310527086258e-05, 1.8358230590820312e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 13.0, 20.0, 15.0, 36.0, 38.0, 68.0, 88.0, 179.0, 283.0, 541.0, 947.0, 1712.0, 3369.0, 6683.0, 14961.0, 37889.0, 100306.0, 255981.0, 349795.0, 167383.0, 63411.0, 24328.0, 10370.0, 4780.0, 2361.0, 1252.0, 676.0, 392.0, 232.0, 145.0, 98.0, 56.0, 36.0, 23.0, 19.0, 11.0, 9.0, 5.0, 11.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.020660400390625, -0.02003931999206543, -0.01941823959350586, -0.01879715919494629, -0.01817607879638672, -0.01755499839782715, -0.016933917999267578, -0.016312837600708008, -0.015691757202148438, -0.015070676803588867, -0.014449596405029297, -0.013828516006469727, -0.013207435607910156, -0.012586355209350586, -0.011965274810791016, -0.011344194412231445, -0.010723114013671875, -0.010102033615112305, -0.009480953216552734, -0.008859872817993164, -0.008238792419433594, -0.0076177120208740234, -0.006996631622314453, -0.006375551223754883, -0.0057544708251953125, -0.005133390426635742, -0.004512310028076172, -0.0038912296295166016, -0.0032701492309570312, -0.002649068832397461, -0.0020279884338378906, -0.0014069080352783203, -0.00078582763671875, -0.0001647472381591797, 0.0004563331604003906, 0.001077413558959961, 0.0016984939575195312, 0.0023195743560791016, 0.002940654754638672, 0.003561735153198242, 0.0041828155517578125, 0.004803895950317383, 0.005424976348876953, 0.0060460567474365234, 0.006667137145996094, 0.007288217544555664, 0.007909297943115234, 0.008530378341674805, 0.009151458740234375, 0.009772539138793945, 0.010393619537353516, 0.011014699935913086, 0.011635780334472656, 0.012256860733032227, 0.012877941131591797, 0.013499021530151367, 0.014120101928710938, 0.014741182327270508, 0.015362262725830078, 0.01598334312438965, 0.01660442352294922, 0.01722550392150879, 0.01784658432006836, 0.01846766471862793, 0.0190887451171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 7.0, 9.0, 10.0, 19.0, 20.0, 20.0, 26.0, 27.0, 23.0, 37.0, 50.0, 53.0, 57.0, 57.0, 64.0, 53.0, 47.0, 50.0, 58.0, 45.0, 43.0, 31.0, 34.0, 22.0, 15.0, 21.0, 17.0, 16.0, 7.0, 7.0, 12.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0158538818359375, -0.015375614166259766, -0.014897346496582031, -0.014419078826904297, -0.013940811157226562, -0.013462543487548828, -0.012984275817871094, -0.01250600814819336, -0.012027740478515625, -0.01154947280883789, -0.011071205139160156, -0.010592937469482422, -0.010114669799804688, -0.009636402130126953, -0.009158134460449219, -0.008679866790771484, -0.00820159912109375, -0.007723331451416016, -0.007245063781738281, -0.006766796112060547, -0.0062885284423828125, -0.005810260772705078, -0.005331993103027344, -0.004853725433349609, -0.004375457763671875, -0.0038971900939941406, -0.0034189224243164062, -0.002940654754638672, -0.0024623870849609375, -0.001984119415283203, -0.0015058517456054688, -0.0010275840759277344, -0.00054931640625, -7.104873657226562e-05, 0.00040721893310546875, 0.0008854866027832031, 0.0013637542724609375, 0.0018420219421386719, 0.0023202896118164062, 0.0027985572814941406, 0.003276824951171875, 0.0037550926208496094, 0.004233360290527344, 0.004711627960205078, 0.0051898956298828125, 0.005668163299560547, 0.006146430969238281, 0.006624698638916016, 0.00710296630859375, 0.007581233978271484, 0.008059501647949219, 0.008537769317626953, 0.009016036987304688, 0.009494304656982422, 0.009972572326660156, 0.01045083999633789, 0.010929107666015625, 0.01140737533569336, 0.011885643005371094, 0.012363910675048828, 0.012842178344726562, 0.013320446014404297, 0.013798713684082031, 0.014276981353759766, 0.0147552490234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 19.0, 19.0, 35.0, 50.0, 69.0, 108.0, 103.0, 134.0, 133.0, 97.0, 76.0, 64.0, 37.0, 8.0, 8.0, 9.0, 9.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26612961292266846, -0.25767847895622253, -0.2492273449897766, -0.2407762110233307, -0.23232507705688477, -0.22387394309043884, -0.21542279422283173, -0.2069716602563858, -0.19852052628993988, -0.19006939232349396, -0.18161825835704803, -0.1731671243906021, -0.164715975522995, -0.15626484155654907, -0.14781370759010315, -0.13936257362365723, -0.1309114396572113, -0.12246030569076538, -0.11400917172431946, -0.10555803030729294, -0.09710689634084702, -0.08865576237440109, -0.08020462095737457, -0.07175348699092865, -0.06330235302448273, -0.054851219058036804, -0.04640008136630058, -0.03794894367456436, -0.02949780970811844, -0.021046675741672516, -0.012595538049936295, -0.004144400358200073, 0.004306763410568237, 0.01275789923965931, 0.02120903506875038, 0.029660170897841454, 0.038111306726932526, 0.04656244069337845, 0.05501357838511467, 0.06346471607685089, 0.07191585004329681, 0.08036698400974274, 0.08881811797618866, 0.09726925939321518, 0.1057203933596611, 0.11417152732610703, 0.12262266874313354, 0.13107380270957947, 0.1395249366760254, 0.1479760706424713, 0.15642720460891724, 0.16487833857536316, 0.17332947254180908, 0.181780606508255, 0.19023175537586212, 0.19868288934230804, 0.20713402330875397, 0.2155851572751999, 0.2240362912416458, 0.23248742520809174, 0.24093857407569885, 0.24938970804214478, 0.2578408420085907, 0.2662919759750366, 0.27474310994148254]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 1.0, 5.0, 10.0, 5.0, 17.0, 9.0, 18.0, 14.0, 22.0, 24.0, 27.0, 37.0, 25.0, 29.0, 36.0, 41.0, 48.0, 36.0, 46.0, 33.0, 46.0, 33.0, 45.0, 34.0, 36.0, 34.0, 31.0, 46.0, 33.0, 28.0, 26.0, 23.0, 18.0, 18.0, 19.0, 15.0, 6.0, 5.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.16888469457626343, -0.16344721615314484, -0.15800973773002625, -0.15257225930690765, -0.14713478088378906, -0.14169730246067047, -0.13625982403755188, -0.1308223307132721, -0.1253848671913147, -0.1199473887681961, -0.11450991034507751, -0.10907243192195892, -0.10363495349884033, -0.09819747507572174, -0.09275998920202255, -0.08732251077890396, -0.08188502490520477, -0.07644754648208618, -0.07101006805896759, -0.065572589635849, -0.06013510748744011, -0.05469762906432152, -0.04926014691591263, -0.04382266849279404, -0.038385190069675446, -0.032947711646556854, -0.027510231360793114, -0.022072751075029373, -0.016635272651910782, -0.01119779422879219, -0.005760312080383301, -0.00032283365726470947, 0.005114644765853882, 0.010552124120295048, 0.015989603474736214, 0.021427083760499954, 0.026864562183618546, 0.03230204060673714, 0.03773952275514603, 0.04317700117826462, 0.04861447960138321, 0.0540519580245018, 0.05948943644762039, 0.06492692232131958, 0.07036440074443817, 0.07580187916755676, 0.08123935759067535, 0.08667683601379395, 0.09211431443691254, 0.09755179286003113, 0.10298927128314972, 0.10842674970626831, 0.1138642281293869, 0.1193017065525055, 0.12473919242620468, 0.13017666339874268, 0.13561415672302246, 0.14105163514614105, 0.14648911356925964, 0.15192659199237823, 0.15736407041549683, 0.16280154883861542, 0.168239027261734, 0.1736765205860138, 0.1791139841079712]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 11.0, 6.0, 7.0, 20.0, 15.0, 16.0, 25.0, 64.0, 80.0, 125.0, 265.0, 403.0, 851.0, 2023.0, 5443.0, 16532.0, 82865.0, 989495.0, 2668665.0, 366349.0, 44640.0, 10172.0, 3657.0, 1355.0, 528.0, 266.0, 142.0, 87.0, 59.0, 27.0, 31.0, 12.0, 12.0, 12.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06524658203125, -0.0629415512084961, -0.06063652038574219, -0.05833148956298828, -0.056026458740234375, -0.05372142791748047, -0.05141639709472656, -0.049111366271972656, -0.04680633544921875, -0.044501304626464844, -0.04219627380371094, -0.03989124298095703, -0.037586212158203125, -0.03528118133544922, -0.03297615051269531, -0.030671119689941406, -0.0283660888671875, -0.026061058044433594, -0.023756027221679688, -0.02145099639892578, -0.019145965576171875, -0.01684093475341797, -0.014535903930664062, -0.012230873107910156, -0.00992584228515625, -0.007620811462402344, -0.0053157806396484375, -0.0030107498168945312, -0.000705718994140625, 0.0015993118286132812, 0.0039043426513671875, 0.006209373474121094, 0.008514404296875, 0.010819435119628906, 0.013124465942382812, 0.015429496765136719, 0.017734527587890625, 0.02003955841064453, 0.022344589233398438, 0.024649620056152344, 0.02695465087890625, 0.029259681701660156, 0.03156471252441406, 0.03386974334716797, 0.036174774169921875, 0.03847980499267578, 0.04078483581542969, 0.043089866638183594, 0.0453948974609375, 0.047699928283691406, 0.05000495910644531, 0.05230998992919922, 0.054615020751953125, 0.05692005157470703, 0.05922508239746094, 0.061530113220214844, 0.06383514404296875, 0.06614017486572266, 0.06844520568847656, 0.07075023651123047, 0.07305526733398438, 0.07536029815673828, 0.07766532897949219, 0.0799703598022461, 0.082275390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 17.0, 30.0, 51.0, 54.0, 111.0, 130.0, 132.0, 148.0, 126.0, 88.0, 44.0, 36.0, 17.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0882568359375, -0.08563041687011719, -0.08300399780273438, -0.08037757873535156, -0.07775115966796875, -0.07512474060058594, -0.07249832153320312, -0.06987190246582031, -0.0672454833984375, -0.06461906433105469, -0.061992645263671875, -0.05936622619628906, -0.05673980712890625, -0.05411338806152344, -0.051486968994140625, -0.04886054992675781, -0.046234130859375, -0.04360771179199219, -0.040981292724609375, -0.03835487365722656, -0.03572845458984375, -0.03310203552246094, -0.030475616455078125, -0.027849197387695312, -0.0252227783203125, -0.022596359252929688, -0.019969940185546875, -0.017343521118164062, -0.01471710205078125, -0.012090682983398438, -0.009464263916015625, -0.0068378448486328125, -0.00421142578125, -0.0015850067138671875, 0.001041412353515625, 0.0036678314208984375, 0.00629425048828125, 0.008920669555664062, 0.011547088623046875, 0.014173507690429688, 0.0167999267578125, 0.019426345825195312, 0.022052764892578125, 0.024679183959960938, 0.02730560302734375, 0.029932022094726562, 0.032558441162109375, 0.03518486022949219, 0.037811279296875, 0.04043769836425781, 0.043064117431640625, 0.04569053649902344, 0.04831695556640625, 0.05094337463378906, 0.053569793701171875, 0.05619621276855469, 0.0588226318359375, 0.06144905090332031, 0.06407546997070312, 0.06670188903808594, 0.06932830810546875, 0.07195472717285156, 0.07458114624023438, 0.07720756530761719, 0.079833984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 4.0, 18.0, 19.0, 21.0, 39.0, 53.0, 75.0, 111.0, 195.0, 369.0, 720.0, 1532.0, 4525.0, 17304.0, 91952.0, 755627.0, 2860610.0, 388592.0, 55216.0, 11435.0, 3335.0, 1224.0, 552.0, 277.0, 170.0, 85.0, 68.0, 43.0, 33.0, 17.0, 10.0, 16.0, 11.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060699462890625, -0.05839681625366211, -0.05609416961669922, -0.05379152297973633, -0.05148887634277344, -0.04918622970581055, -0.046883583068847656, -0.044580936431884766, -0.042278289794921875, -0.039975643157958984, -0.037672996520996094, -0.0353703498840332, -0.03306770324707031, -0.030765056610107422, -0.02846240997314453, -0.02615976333618164, -0.02385711669921875, -0.02155447006225586, -0.01925182342529297, -0.016949176788330078, -0.014646530151367188, -0.012343883514404297, -0.010041236877441406, -0.007738590240478516, -0.005435943603515625, -0.0031332969665527344, -0.0008306503295898438, 0.0014719963073730469, 0.0037746429443359375, 0.006077289581298828, 0.008379936218261719, 0.01068258285522461, 0.0129852294921875, 0.01528787612915039, 0.01759052276611328, 0.019893169403076172, 0.022195816040039062, 0.024498462677001953, 0.026801109313964844, 0.029103755950927734, 0.031406402587890625, 0.033709049224853516, 0.036011695861816406, 0.0383143424987793, 0.04061698913574219, 0.04291963577270508, 0.04522228240966797, 0.04752492904663086, 0.04982757568359375, 0.05213022232055664, 0.05443286895751953, 0.05673551559448242, 0.05903816223144531, 0.0613408088684082, 0.0636434555053711, 0.06594610214233398, 0.06824874877929688, 0.07055139541625977, 0.07285404205322266, 0.07515668869018555, 0.07745933532714844, 0.07976198196411133, 0.08206462860107422, 0.08436727523803711, 0.086669921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 11.0, 16.0, 10.0, 24.0, 20.0, 32.0, 41.0, 60.0, 76.0, 89.0, 124.0, 160.0, 227.0, 334.0, 419.0, 518.0, 460.0, 364.0, 279.0, 219.0, 151.0, 104.0, 73.0, 52.0, 47.0, 28.0, 35.0, 19.0, 11.0, 14.0, 7.0, 12.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05029296875, -0.04875755310058594, -0.047222137451171875, -0.04568672180175781, -0.04415130615234375, -0.04261589050292969, -0.041080474853515625, -0.03954505920410156, -0.0380096435546875, -0.03647422790527344, -0.034938812255859375, -0.03340339660644531, -0.03186798095703125, -0.030332565307617188, -0.028797149658203125, -0.027261734008789062, -0.025726318359375, -0.024190902709960938, -0.022655487060546875, -0.021120071411132812, -0.01958465576171875, -0.018049240112304688, -0.016513824462890625, -0.014978408813476562, -0.0134429931640625, -0.011907577514648438, -0.010372161865234375, -0.008836746215820312, -0.00730133056640625, -0.0057659149169921875, -0.004230499267578125, -0.0026950836181640625, -0.00115966796875, 0.0003757476806640625, 0.001911163330078125, 0.0034465789794921875, 0.00498199462890625, 0.0065174102783203125, 0.008052825927734375, 0.009588241577148438, 0.0111236572265625, 0.012659072875976562, 0.014194488525390625, 0.015729904174804688, 0.01726531982421875, 0.018800735473632812, 0.020336151123046875, 0.021871566772460938, 0.023406982421875, 0.024942398071289062, 0.026477813720703125, 0.028013229370117188, 0.02954864501953125, 0.031084060668945312, 0.032619476318359375, 0.03415489196777344, 0.0356903076171875, 0.03722572326660156, 0.038761138916015625, 0.04029655456542969, 0.04183197021484375, 0.04336738586425781, 0.044902801513671875, 0.04643821716308594, 0.0479736328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 43.0, 79.0, 174.0, 228.0, 218.0, 147.0, 68.0, 17.0, 9.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39122310280799866, -0.36937573552131653, -0.3475283682346344, -0.32568100094795227, -0.30383363366127014, -0.281986266374588, -0.2601388692855835, -0.23829151690006256, -0.21644414961338043, -0.1945967823266983, -0.17274941504001617, -0.15090203285217285, -0.12905466556549072, -0.10720730572938919, -0.08535993099212646, -0.06351256370544434, -0.04166519641876221, -0.01981782726943493, 0.0020295418798923492, 0.023876912891864777, 0.045724280178546906, 0.06757164746522903, 0.08941902220249176, 0.11126638948917389, 0.13311375677585602, 0.15496112406253815, 0.17680849134922028, 0.1986558735370636, 0.22050324082374573, 0.24235060811042786, 0.26419797539711, 0.2860453426837921, 0.30789273977279663, 0.32974010705947876, 0.3515874743461609, 0.373434841632843, 0.39528220891952515, 0.4171295762062073, 0.4389769434928894, 0.46082431077957153, 0.48267167806625366, 0.5045190453529358, 0.5263664126396179, 0.5482137799263, 0.5700611472129822, 0.5919085144996643, 0.6137558817863464, 0.6356032490730286, 0.6574506759643555, 0.6792980432510376, 0.7011454105377197, 0.7229927778244019, 0.744840145111084, 0.7666875123977661, 0.7885348796844482, 0.8103822469711304, 0.8322296142578125, 0.8540769815444946, 0.8759243488311768, 0.8977717161178589, 0.919619083404541, 0.9414664506912231, 0.9633138179779053, 0.9851611852645874, 1.0070085525512695]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 5.0, 11.0, 13.0, 4.0, 19.0, 14.0, 23.0, 19.0, 22.0, 18.0, 27.0, 23.0, 35.0, 39.0, 28.0, 33.0, 35.0, 27.0, 43.0, 29.0, 38.0, 44.0, 41.0, 36.0, 34.0, 36.0, 37.0, 34.0, 37.0, 21.0, 22.0, 18.0, 14.0, 19.0, 12.0, 17.0, 11.0, 10.0, 8.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1346113085746765, -0.1298602968454361, -0.12510928511619568, -0.12035828828811646, -0.11560727655887604, -0.11085626482963562, -0.1061052605509758, -0.10135425627231598, -0.09660324454307556, -0.09185223281383514, -0.08710122853517532, -0.0823502242565155, -0.07759921252727509, -0.07284820079803467, -0.06809719651937485, -0.06334619224071503, -0.05859518051147461, -0.05384417250752449, -0.04909316450357437, -0.04434215649962425, -0.03959114849567413, -0.034840140491724014, -0.030089132487773895, -0.025338124483823776, -0.020587116479873657, -0.015836108475923538, -0.01108510047197342, -0.0063340924680233, -0.0015830844640731812, 0.003167923539876938, 0.007918931543827057, 0.012669939547777176, 0.017420947551727295, 0.022171955555677414, 0.026922963559627533, 0.03167397156357765, 0.03642497956752777, 0.04117598757147789, 0.04592699557542801, 0.05067800357937813, 0.05542901158332825, 0.060180019587278366, 0.06493102759122849, 0.0696820318698883, 0.07443304359912872, 0.07918405532836914, 0.08393505960702896, 0.08868606388568878, 0.0934370756149292, 0.09818808734416962, 0.10293909162282944, 0.10769009590148926, 0.11244110763072968, 0.11719211935997009, 0.12194312363862991, 0.12669412791728973, 0.13144513964653015, 0.13619615137577057, 0.140947163105011, 0.1456981599330902, 0.15044917166233063, 0.15520018339157104, 0.15995118021965027, 0.16470219194889069, 0.1694532036781311]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 3.0, 6.0, 16.0, 4.0, 24.0, 32.0, 31.0, 45.0, 53.0, 58.0, 92.0, 127.0, 175.0, 296.0, 501.0, 873.0, 1879.0, 4333.0, 12012.0, 39153.0, 135355.0, 348186.0, 330049.0, 120945.0, 35224.0, 11093.0, 3884.0, 1753.0, 841.0, 513.0, 321.0, 189.0, 101.0, 75.0, 58.0, 63.0, 43.0, 25.0, 23.0, 22.0, 14.0, 17.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.0663442611694336, -0.06426811218261719, -0.06219196319580078, -0.060115814208984375, -0.05803966522216797, -0.05596351623535156, -0.053887367248535156, -0.05181121826171875, -0.049735069274902344, -0.04765892028808594, -0.04558277130126953, -0.043506622314453125, -0.04143047332763672, -0.03935432434082031, -0.037278175354003906, -0.0352020263671875, -0.033125877380371094, -0.031049728393554688, -0.02897357940673828, -0.026897430419921875, -0.02482128143310547, -0.022745132446289062, -0.020668983459472656, -0.01859283447265625, -0.016516685485839844, -0.014440536499023438, -0.012364387512207031, -0.010288238525390625, -0.008212089538574219, -0.0061359405517578125, -0.004059791564941406, -0.001983642578125, 9.250640869140625e-05, 0.0021686553955078125, 0.004244804382324219, 0.006320953369140625, 0.008397102355957031, 0.010473251342773438, 0.012549400329589844, 0.01462554931640625, 0.016701698303222656, 0.018777847290039062, 0.02085399627685547, 0.022930145263671875, 0.02500629425048828, 0.027082443237304688, 0.029158592224121094, 0.0312347412109375, 0.033310890197753906, 0.03538703918457031, 0.03746318817138672, 0.039539337158203125, 0.04161548614501953, 0.04369163513183594, 0.045767784118652344, 0.04784393310546875, 0.049920082092285156, 0.05199623107910156, 0.05407238006591797, 0.056148529052734375, 0.05822467803955078, 0.06030082702636719, 0.062376976013183594, 0.064453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 17.0, 24.0, 49.0, 77.0, 99.0, 113.0, 149.0, 138.0, 133.0, 77.0, 61.0, 31.0, 22.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.096435546875, -0.0937337875366211, -0.09103202819824219, -0.08833026885986328, -0.08562850952148438, -0.08292675018310547, -0.08022499084472656, -0.07752323150634766, -0.07482147216796875, -0.07211971282958984, -0.06941795349121094, -0.06671619415283203, -0.06401443481445312, -0.06131267547607422, -0.05861091613769531, -0.055909156799316406, -0.0532073974609375, -0.050505638122558594, -0.04780387878417969, -0.04510211944580078, -0.042400360107421875, -0.03969860076904297, -0.03699684143066406, -0.034295082092285156, -0.03159332275390625, -0.028891563415527344, -0.026189804077148438, -0.02348804473876953, -0.020786285400390625, -0.01808452606201172, -0.015382766723632812, -0.012681007385253906, -0.009979248046875, -0.007277488708496094, -0.0045757293701171875, -0.0018739700317382812, 0.000827789306640625, 0.0035295486450195312, 0.0062313079833984375, 0.008933067321777344, 0.01163482666015625, 0.014336585998535156, 0.017038345336914062, 0.01974010467529297, 0.022441864013671875, 0.02514362335205078, 0.027845382690429688, 0.030547142028808594, 0.0332489013671875, 0.035950660705566406, 0.03865242004394531, 0.04135417938232422, 0.044055938720703125, 0.04675769805908203, 0.04945945739746094, 0.052161216735839844, 0.05486297607421875, 0.057564735412597656, 0.06026649475097656, 0.06296825408935547, 0.06567001342773438, 0.06837177276611328, 0.07107353210449219, 0.0737752914428711, 0.07647705078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 4.0, 9.0, 7.0, 17.0, 17.0, 21.0, 21.0, 41.0, 42.0, 65.0, 90.0, 161.0, 225.0, 403.0, 745.0, 1488.0, 3011.0, 6515.0, 14350.0, 32621.0, 74614.0, 157575.0, 261607.0, 244527.0, 136976.0, 62532.0, 27344.0, 12274.0, 5517.0, 2656.0, 1338.0, 687.0, 362.0, 220.0, 145.0, 82.0, 56.0, 45.0, 34.0, 21.0, 15.0, 15.0, 18.0, 13.0, 11.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0380859375, -0.03685331344604492, -0.035620689392089844, -0.034388065338134766, -0.03315544128417969, -0.03192281723022461, -0.03069019317626953, -0.029457569122314453, -0.028224945068359375, -0.026992321014404297, -0.02575969696044922, -0.02452707290649414, -0.023294448852539062, -0.022061824798583984, -0.020829200744628906, -0.019596576690673828, -0.01836395263671875, -0.017131328582763672, -0.015898704528808594, -0.014666080474853516, -0.013433456420898438, -0.01220083236694336, -0.010968208312988281, -0.009735584259033203, -0.008502960205078125, -0.007270336151123047, -0.006037712097167969, -0.004805088043212891, -0.0035724639892578125, -0.0023398399353027344, -0.0011072158813476562, 0.00012540817260742188, 0.0013580322265625, 0.002590656280517578, 0.0038232803344726562, 0.005055904388427734, 0.0062885284423828125, 0.007521152496337891, 0.008753776550292969, 0.009986400604248047, 0.011219024658203125, 0.012451648712158203, 0.013684272766113281, 0.01491689682006836, 0.016149520874023438, 0.017382144927978516, 0.018614768981933594, 0.019847393035888672, 0.02108001708984375, 0.022312641143798828, 0.023545265197753906, 0.024777889251708984, 0.026010513305664062, 0.02724313735961914, 0.02847576141357422, 0.029708385467529297, 0.030941009521484375, 0.03217363357543945, 0.03340625762939453, 0.03463888168334961, 0.03587150573730469, 0.037104129791259766, 0.038336753845214844, 0.03956937789916992, 0.040802001953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 8.0, 11.0, 5.0, 16.0, 12.0, 14.0, 19.0, 19.0, 14.0, 20.0, 24.0, 25.0, 30.0, 39.0, 36.0, 32.0, 30.0, 56.0, 40.0, 32.0, 41.0, 29.0, 34.0, 37.0, 35.0, 42.0, 30.0, 29.0, 27.0, 26.0, 31.0, 20.0, 19.0, 15.0, 10.0, 11.0, 15.0, 12.0, 10.0, 8.0, 6.0, 2.0, 5.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06195068359375, -0.06004047393798828, -0.05813026428222656, -0.056220054626464844, -0.054309844970703125, -0.052399635314941406, -0.05048942565917969, -0.04857921600341797, -0.04666900634765625, -0.04475879669189453, -0.04284858703613281, -0.040938377380371094, -0.039028167724609375, -0.037117958068847656, -0.03520774841308594, -0.03329753875732422, -0.0313873291015625, -0.02947711944580078, -0.027566909790039062, -0.025656700134277344, -0.023746490478515625, -0.021836280822753906, -0.019926071166992188, -0.01801586151123047, -0.01610565185546875, -0.014195442199707031, -0.012285232543945312, -0.010375022888183594, -0.008464813232421875, -0.006554603576660156, -0.0046443939208984375, -0.0027341842651367188, -0.000823974609375, 0.0010862350463867188, 0.0029964447021484375, 0.004906654357910156, 0.006816864013671875, 0.008727073669433594, 0.010637283325195312, 0.012547492980957031, 0.01445770263671875, 0.01636791229248047, 0.018278121948242188, 0.020188331604003906, 0.022098541259765625, 0.024008750915527344, 0.025918960571289062, 0.02782917022705078, 0.0297393798828125, 0.03164958953857422, 0.03355979919433594, 0.035470008850097656, 0.037380218505859375, 0.039290428161621094, 0.04120063781738281, 0.04311084747314453, 0.04502105712890625, 0.04693126678466797, 0.04884147644042969, 0.050751686096191406, 0.052661895751953125, 0.054572105407714844, 0.05648231506347656, 0.05839252471923828, 0.060302734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 7.0, 5.0, 6.0, 13.0, 18.0, 21.0, 30.0, 55.0, 109.0, 183.0, 318.0, 647.0, 1600.0, 4437.0, 13207.0, 43534.0, 132599.0, 290820.0, 316926.0, 162261.0, 55858.0, 16913.0, 5372.0, 1922.0, 825.0, 389.0, 205.0, 89.0, 46.0, 50.0, 25.0, 19.0, 16.0, 10.0, 1.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0200042724609375, -0.01945018768310547, -0.018896102905273438, -0.018342018127441406, -0.017787933349609375, -0.017233848571777344, -0.016679763793945312, -0.01612567901611328, -0.01557159423828125, -0.015017509460449219, -0.014463424682617188, -0.013909339904785156, -0.013355255126953125, -0.012801170349121094, -0.012247085571289062, -0.011693000793457031, -0.011138916015625, -0.010584831237792969, -0.010030746459960938, -0.009476661682128906, -0.008922576904296875, -0.008368492126464844, -0.007814407348632812, -0.007260322570800781, -0.00670623779296875, -0.006152153015136719, -0.0055980682373046875, -0.005043983459472656, -0.004489898681640625, -0.003935813903808594, -0.0033817291259765625, -0.0028276443481445312, -0.0022735595703125, -0.0017194747924804688, -0.0011653900146484375, -0.0006113052368164062, -5.7220458984375e-05, 0.0004968643188476562, 0.0010509490966796875, 0.0016050338745117188, 0.00215911865234375, 0.0027132034301757812, 0.0032672882080078125, 0.0038213729858398438, 0.004375457763671875, 0.004929542541503906, 0.0054836273193359375, 0.006037712097167969, 0.006591796875, 0.007145881652832031, 0.0076999664306640625, 0.008254051208496094, 0.008808135986328125, 0.009362220764160156, 0.009916305541992188, 0.010470390319824219, 0.01102447509765625, 0.011578559875488281, 0.012132644653320312, 0.012686729431152344, 0.013240814208984375, 0.013794898986816406, 0.014348983764648438, 0.014903068542480469, 0.0154571533203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 7.0, 3.0, 10.0, 5.0, 17.0, 13.0, 15.0, 27.0, 12.0, 21.0, 16.0, 24.0, 35.0, 15.0, 49.0, 26.0, 31.0, 49.0, 39.0, 55.0, 26.0, 52.0, 33.0, 43.0, 47.0, 34.0, 40.0, 26.0, 25.0, 30.0, 12.0, 33.0, 18.0, 11.0, 16.0, 10.0, 15.0, 8.0, 8.0, 8.0, 5.0, 7.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-5.0067901611328125e-06, -4.863366484642029e-06, -4.719942808151245e-06, -4.5765191316604614e-06, -4.433095455169678e-06, -4.289671778678894e-06, -4.14624810218811e-06, -4.002824425697327e-06, -3.859400749206543e-06, -3.7159770727157593e-06, -3.5725533962249756e-06, -3.429129719734192e-06, -3.285706043243408e-06, -3.1422823667526245e-06, -2.998858690261841e-06, -2.855435013771057e-06, -2.7120113372802734e-06, -2.5685876607894897e-06, -2.425163984298706e-06, -2.2817403078079224e-06, -2.1383166313171387e-06, -1.994892954826355e-06, -1.8514692783355713e-06, -1.7080456018447876e-06, -1.564621925354004e-06, -1.4211982488632202e-06, -1.2777745723724365e-06, -1.1343508958816528e-06, -9.909272193908691e-07, -8.475035429000854e-07, -7.040798664093018e-07, -5.606561899185181e-07, -4.172325134277344e-07, -2.738088369369507e-07, -1.30385160446167e-07, 1.30385160446167e-08, 1.564621925354004e-07, 2.998858690261841e-07, 4.4330954551696777e-07, 5.867332220077515e-07, 7.301568984985352e-07, 8.735805749893188e-07, 1.0170042514801025e-06, 1.1604279279708862e-06, 1.30385160446167e-06, 1.4472752809524536e-06, 1.5906989574432373e-06, 1.734122633934021e-06, 1.8775463104248047e-06, 2.0209699869155884e-06, 2.164393663406372e-06, 2.3078173398971558e-06, 2.4512410163879395e-06, 2.594664692878723e-06, 2.738088369369507e-06, 2.8815120458602905e-06, 3.0249357223510742e-06, 3.168359398841858e-06, 3.3117830753326416e-06, 3.4552067518234253e-06, 3.598630428314209e-06, 3.7420541048049927e-06, 3.885477781295776e-06, 4.02890145778656e-06, 4.172325134277344e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 7.0, 9.0, 8.0, 19.0, 29.0, 76.0, 102.0, 174.0, 325.0, 582.0, 1058.0, 2376.0, 6016.0, 16890.0, 50487.0, 136452.0, 276800.0, 298063.0, 162730.0, 62417.0, 21020.0, 7336.0, 2899.0, 1205.0, 637.0, 352.0, 227.0, 100.0, 74.0, 33.0, 27.0, 12.0, 2.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015899658203125, -0.015290498733520508, -0.014681339263916016, -0.014072179794311523, -0.013463020324707031, -0.012853860855102539, -0.012244701385498047, -0.011635541915893555, -0.011026382446289062, -0.01041722297668457, -0.009808063507080078, -0.009198904037475586, -0.008589744567871094, -0.007980585098266602, -0.007371425628662109, -0.006762266159057617, -0.006153106689453125, -0.005543947219848633, -0.004934787750244141, -0.0043256282806396484, -0.0037164688110351562, -0.003107309341430664, -0.002498149871826172, -0.0018889904022216797, -0.0012798309326171875, -0.0006706714630126953, -6.151199340820312e-05, 0.0005476474761962891, 0.0011568069458007812, 0.0017659664154052734, 0.0023751258850097656, 0.002984285354614258, 0.00359344482421875, 0.004202604293823242, 0.004811763763427734, 0.0054209232330322266, 0.006030082702636719, 0.006639242172241211, 0.007248401641845703, 0.007857561111450195, 0.008466720581054688, 0.00907588005065918, 0.009685039520263672, 0.010294198989868164, 0.010903358459472656, 0.011512517929077148, 0.01212167739868164, 0.012730836868286133, 0.013339996337890625, 0.013949155807495117, 0.01455831527709961, 0.015167474746704102, 0.015776634216308594, 0.016385793685913086, 0.016994953155517578, 0.01760411262512207, 0.018213272094726562, 0.018822431564331055, 0.019431591033935547, 0.02004075050354004, 0.02064990997314453, 0.021259069442749023, 0.021868228912353516, 0.022477388381958008, 0.0230865478515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 9.0, 15.0, 9.0, 18.0, 13.0, 16.0, 15.0, 25.0, 22.0, 26.0, 28.0, 25.0, 32.0, 44.0, 37.0, 48.0, 44.0, 45.0, 54.0, 47.0, 52.0, 45.0, 36.0, 41.0, 28.0, 38.0, 23.0, 29.0, 25.0, 14.0, 17.0, 16.0, 9.0, 7.0, 3.0, 7.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0108489990234375, -0.010486841201782227, -0.010124683380126953, -0.00976252555847168, -0.009400367736816406, -0.009038209915161133, -0.00867605209350586, -0.008313894271850586, -0.007951736450195312, -0.007589578628540039, -0.007227420806884766, -0.006865262985229492, -0.006503105163574219, -0.006140947341918945, -0.005778789520263672, -0.0054166316986083984, -0.005054473876953125, -0.0046923160552978516, -0.004330158233642578, -0.003968000411987305, -0.0036058425903320312, -0.003243684768676758, -0.0028815269470214844, -0.002519369125366211, -0.0021572113037109375, -0.001795053482055664, -0.0014328956604003906, -0.0010707378387451172, -0.0007085800170898438, -0.0003464221954345703, 1.5735626220703125e-05, 0.00037789344787597656, 0.00074005126953125, 0.0011022090911865234, 0.0014643669128417969, 0.0018265247344970703, 0.0021886825561523438, 0.002550840377807617, 0.0029129981994628906, 0.003275156021118164, 0.0036373138427734375, 0.003999471664428711, 0.004361629486083984, 0.004723787307739258, 0.005085945129394531, 0.005448102951049805, 0.005810260772705078, 0.0061724185943603516, 0.006534576416015625, 0.0068967342376708984, 0.007258892059326172, 0.007621049880981445, 0.007983207702636719, 0.008345365524291992, 0.008707523345947266, 0.009069681167602539, 0.009431838989257812, 0.009793996810913086, 0.01015615463256836, 0.010518312454223633, 0.010880470275878906, 0.01124262809753418, 0.011604785919189453, 0.011966943740844727, 0.0123291015625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 39.0, 219.0, 441.0, 239.0, 45.0, 11.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1452641487121582, -1.1181871891021729, -1.091110348701477, -1.0640333890914917, -1.036956548690796, -1.0098795890808105, -0.98280268907547, -0.9557257890701294, -0.9286488890647888, -0.9015719890594482, -0.8744950890541077, -0.8474181890487671, -0.8203412294387817, -0.7932643294334412, -0.7661874294281006, -0.73911052942276, -0.7120336294174194, -0.6849567294120789, -0.6578798294067383, -0.6308028697967529, -0.6037259697914124, -0.5766490697860718, -0.5495721697807312, -0.5224952697753906, -0.4954183101654053, -0.4683414101600647, -0.44126448035240173, -0.41418758034706116, -0.3871106803417206, -0.3600337505340576, -0.33295685052871704, -0.30587995052337646, -0.2788030505180359, -0.2517261505126953, -0.22464923560619354, -0.19757232069969177, -0.1704954206943512, -0.14341850578784943, -0.11634159088134766, -0.08926469087600708, -0.06218777596950531, -0.03511086851358414, -0.008033957332372665, 0.019042953848838806, 0.04611986130475998, 0.07319676876068115, 0.10027368366718292, 0.1273505836725235, 0.15442749857902527, 0.18150441348552704, 0.20858131349086761, 0.23565822839736938, 0.26273512840270996, 0.28981202840805054, 0.3168889582157135, 0.3439658582210541, 0.37104278802871704, 0.3981196880340576, 0.4251966178417206, 0.45227351784706116, 0.47935041785240173, 0.5064273476600647, 0.5335042476654053, 0.5605811476707458, 0.5876580476760864]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 8.0, 8.0, 9.0, 15.0, 13.0, 19.0, 17.0, 22.0, 21.0, 40.0, 41.0, 35.0, 44.0, 48.0, 33.0, 48.0, 44.0, 40.0, 41.0, 34.0, 46.0, 44.0, 41.0, 30.0, 36.0, 27.0, 31.0, 20.0, 19.0, 16.0, 16.0, 14.0, 21.0, 9.0, 4.0, 7.0, 9.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1647854447364807, -0.15922793745994568, -0.15367043018341064, -0.1481129229068756, -0.14255543053150177, -0.13699792325496674, -0.1314404159784317, -0.12588290870189667, -0.12032540887594223, -0.1147679015994072, -0.10921040177345276, -0.10365289449691772, -0.09809538722038269, -0.09253788739442825, -0.08698038011789322, -0.08142288029193878, -0.07586537301540375, -0.07030786573886871, -0.06475036591291428, -0.05919285863637924, -0.053635355085134506, -0.04807785153388977, -0.042520344257354736, -0.03696284070611, -0.031405337154865265, -0.02584783360362053, -0.020290328189730644, -0.01473282277584076, -0.009175319224596024, -0.003617815673351288, 0.0019396916031837463, 0.007497195154428482, 0.013054698705673218, 0.018612202256917953, 0.02416970767080784, 0.029727213084697723, 0.03528471663594246, 0.040842220187187195, 0.04639972746372223, 0.051957231014966965, 0.0575147345662117, 0.06307224184274673, 0.06862974166870117, 0.0741872489452362, 0.07974475622177124, 0.08530225604772568, 0.09085976332426071, 0.09641726315021515, 0.10197477042675018, 0.10753227770328522, 0.11308977752923965, 0.11864728480577469, 0.12420478463172913, 0.12976229190826416, 0.1353197991847992, 0.14087730646133423, 0.14643481373786926, 0.1519923210144043, 0.15754982829093933, 0.16310733556747437, 0.1686648279428482, 0.17422233521938324, 0.17977984249591827, 0.1853373497724533, 0.19089484214782715]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 3.0, 8.0, 13.0, 21.0, 33.0, 44.0, 70.0, 113.0, 189.0, 366.0, 846.0, 2369.0, 7410.0, 27299.0, 202924.0, 2216305.0, 1576315.0, 129590.0, 21196.0, 5783.0, 2034.0, 735.0, 293.0, 140.0, 76.0, 37.0, 27.0, 15.0, 14.0, 8.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0760498046875, -0.0738067626953125, -0.071563720703125, -0.0693206787109375, -0.06707763671875, -0.0648345947265625, -0.062591552734375, -0.0603485107421875, -0.05810546875, -0.0558624267578125, -0.053619384765625, -0.0513763427734375, -0.04913330078125, -0.0468902587890625, -0.044647216796875, -0.0424041748046875, -0.0401611328125, -0.0379180908203125, -0.035675048828125, -0.0334320068359375, -0.03118896484375, -0.0289459228515625, -0.026702880859375, -0.0244598388671875, -0.022216796875, -0.0199737548828125, -0.017730712890625, -0.0154876708984375, -0.01324462890625, -0.0110015869140625, -0.008758544921875, -0.0065155029296875, -0.0042724609375, -0.0020294189453125, 0.000213623046875, 0.0024566650390625, 0.00469970703125, 0.0069427490234375, 0.009185791015625, 0.0114288330078125, 0.013671875, 0.0159149169921875, 0.018157958984375, 0.0204010009765625, 0.02264404296875, 0.0248870849609375, 0.027130126953125, 0.0293731689453125, 0.0316162109375, 0.0338592529296875, 0.036102294921875, 0.0383453369140625, 0.04058837890625, 0.0428314208984375, 0.045074462890625, 0.0473175048828125, 0.049560546875, 0.0518035888671875, 0.054046630859375, 0.0562896728515625, 0.05853271484375, 0.0607757568359375, 0.063018798828125, 0.0652618408203125, 0.0675048828125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 12.0, 25.0, 40.0, 70.0, 80.0, 117.0, 133.0, 132.0, 115.0, 96.0, 66.0, 58.0, 31.0, 15.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0860595703125, -0.0835428237915039, -0.08102607727050781, -0.07850933074951172, -0.07599258422851562, -0.07347583770751953, -0.07095909118652344, -0.06844234466552734, -0.06592559814453125, -0.06340885162353516, -0.06089210510253906, -0.05837535858154297, -0.055858612060546875, -0.05334186553955078, -0.05082511901855469, -0.048308372497558594, -0.0457916259765625, -0.043274879455566406, -0.04075813293457031, -0.03824138641357422, -0.035724639892578125, -0.03320789337158203, -0.030691146850585938, -0.028174400329589844, -0.02565765380859375, -0.023140907287597656, -0.020624160766601562, -0.01810741424560547, -0.015590667724609375, -0.013073921203613281, -0.010557174682617188, -0.008040428161621094, -0.005523681640625, -0.0030069351196289062, -0.0004901885986328125, 0.0020265579223632812, 0.004543304443359375, 0.007060050964355469, 0.009576797485351562, 0.012093544006347656, 0.01461029052734375, 0.017127037048339844, 0.019643783569335938, 0.02216053009033203, 0.024677276611328125, 0.02719402313232422, 0.029710769653320312, 0.032227516174316406, 0.0347442626953125, 0.037261009216308594, 0.03977775573730469, 0.04229450225830078, 0.044811248779296875, 0.04732799530029297, 0.04984474182128906, 0.052361488342285156, 0.05487823486328125, 0.057394981384277344, 0.05991172790527344, 0.06242847442626953, 0.06494522094726562, 0.06746196746826172, 0.06997871398925781, 0.0724954605102539, 0.07501220703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 6.0, 8.0, 10.0, 23.0, 29.0, 44.0, 67.0, 119.0, 180.0, 281.0, 553.0, 1490.0, 6921.0, 55016.0, 1015391.0, 2951844.0, 143816.0, 14305.0, 2544.0, 754.0, 340.0, 192.0, 122.0, 68.0, 49.0, 37.0, 25.0, 15.0, 11.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.07860279083251953, -0.07560157775878906, -0.0726003646850586, -0.06959915161132812, -0.06659793853759766, -0.06359672546386719, -0.06059551239013672, -0.05759429931640625, -0.05459308624267578, -0.05159187316894531, -0.048590660095214844, -0.045589447021484375, -0.042588233947753906, -0.03958702087402344, -0.03658580780029297, -0.0335845947265625, -0.03058338165283203, -0.027582168579101562, -0.024580955505371094, -0.021579742431640625, -0.018578529357910156, -0.015577316284179688, -0.012576103210449219, -0.00957489013671875, -0.006573677062988281, -0.0035724639892578125, -0.0005712509155273438, 0.002429962158203125, 0.005431175231933594, 0.008432388305664062, 0.011433601379394531, 0.014434814453125, 0.01743602752685547, 0.020437240600585938, 0.023438453674316406, 0.026439666748046875, 0.029440879821777344, 0.03244209289550781, 0.03544330596923828, 0.03844451904296875, 0.04144573211669922, 0.04444694519042969, 0.047448158264160156, 0.050449371337890625, 0.053450584411621094, 0.05645179748535156, 0.05945301055908203, 0.0624542236328125, 0.06545543670654297, 0.06845664978027344, 0.0714578628540039, 0.07445907592773438, 0.07746028900146484, 0.08046150207519531, 0.08346271514892578, 0.08646392822265625, 0.08946514129638672, 0.09246635437011719, 0.09546756744384766, 0.09846878051757812, 0.1014699935913086, 0.10447120666503906, 0.10747241973876953, 0.1104736328125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 9.0, 11.0, 7.0, 10.0, 14.0, 20.0, 30.0, 40.0, 47.0, 51.0, 75.0, 86.0, 133.0, 186.0, 230.0, 315.0, 514.0, 477.0, 460.0, 349.0, 280.0, 185.0, 131.0, 83.0, 77.0, 54.0, 51.0, 34.0, 22.0, 23.0, 18.0, 10.0, 11.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.044830322265625, -0.04349374771118164, -0.04215717315673828, -0.04082059860229492, -0.03948402404785156, -0.0381474494934082, -0.036810874938964844, -0.035474300384521484, -0.034137725830078125, -0.032801151275634766, -0.031464576721191406, -0.030128002166748047, -0.028791427612304688, -0.027454853057861328, -0.02611827850341797, -0.02478170394897461, -0.02344512939453125, -0.02210855484008789, -0.02077198028564453, -0.019435405731201172, -0.018098831176757812, -0.016762256622314453, -0.015425682067871094, -0.014089107513427734, -0.012752532958984375, -0.011415958404541016, -0.010079383850097656, -0.008742809295654297, -0.0074062347412109375, -0.006069660186767578, -0.004733085632324219, -0.0033965110778808594, -0.0020599365234375, -0.0007233619689941406, 0.0006132125854492188, 0.0019497871398925781, 0.0032863616943359375, 0.004622936248779297, 0.005959510803222656, 0.007296085357666016, 0.008632659912109375, 0.009969234466552734, 0.011305809020996094, 0.012642383575439453, 0.013978958129882812, 0.015315532684326172, 0.01665210723876953, 0.01798868179321289, 0.01932525634765625, 0.02066183090209961, 0.02199840545654297, 0.023334980010986328, 0.024671554565429688, 0.026008129119873047, 0.027344703674316406, 0.028681278228759766, 0.030017852783203125, 0.031354427337646484, 0.032691001892089844, 0.0340275764465332, 0.03536415100097656, 0.03670072555541992, 0.03803730010986328, 0.03937387466430664, 0.04071044921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 10.0, 7.0, 17.0, 40.0, 52.0, 94.0, 104.0, 143.0, 142.0, 136.0, 101.0, 65.0, 51.0, 18.0, 14.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3541611433029175, -0.3428930640220642, -0.33162498474121094, -0.32035690546035767, -0.3090888261795044, -0.2978207468986511, -0.28655266761779785, -0.2752845883369446, -0.2640165090560913, -0.25274842977523804, -0.24148035049438477, -0.2302122712135315, -0.21894419193267822, -0.20767611265182495, -0.19640803337097168, -0.1851399540901184, -0.17387187480926514, -0.16260379552841187, -0.1513357162475586, -0.14006763696670532, -0.12879955768585205, -0.11753147840499878, -0.10626339912414551, -0.09499531984329224, -0.08372724056243896, -0.0724591612815857, -0.06119108200073242, -0.04992300271987915, -0.03865492343902588, -0.027386844158172607, -0.016118764877319336, -0.0048506855964660645, 0.006417393684387207, 0.01768547296524048, 0.02895355224609375, 0.04022163152694702, 0.05148971080780029, 0.06275779008865356, 0.07402586936950684, 0.08529394865036011, 0.09656202793121338, 0.10783010721206665, 0.11909818649291992, 0.1303662657737732, 0.14163434505462646, 0.15290242433547974, 0.164170503616333, 0.17543858289718628, 0.18670666217803955, 0.19797474145889282, 0.2092428207397461, 0.22051090002059937, 0.23177897930145264, 0.2430470585823059, 0.2543151378631592, 0.26558321714401245, 0.2768512964248657, 0.288119375705719, 0.29938745498657227, 0.31065553426742554, 0.3219236135482788, 0.3331916928291321, 0.34445977210998535, 0.3557278513908386, 0.3669959306716919]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 10.0, 7.0, 15.0, 10.0, 13.0, 12.0, 13.0, 14.0, 19.0, 16.0, 26.0, 30.0, 40.0, 33.0, 33.0, 37.0, 36.0, 32.0, 40.0, 45.0, 45.0, 32.0, 37.0, 37.0, 34.0, 42.0, 24.0, 43.0, 30.0, 27.0, 22.0, 20.0, 15.0, 17.0, 15.0, 14.0, 9.0, 11.0, 8.0, 5.0, 4.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1225472092628479, -0.11832526326179504, -0.11410331726074219, -0.10988137125968933, -0.10565942525863647, -0.10143747925758362, -0.09721552580595016, -0.09299357980489731, -0.08877163380384445, -0.0845496878027916, -0.08032774180173874, -0.07610579580068588, -0.07188384234905243, -0.06766189634799957, -0.06343995034694672, -0.05921800434589386, -0.054996058344841, -0.05077411234378815, -0.04655216634273529, -0.042330216616392136, -0.03810827061533928, -0.03388632461428642, -0.029664376750588417, -0.02544242888689041, -0.021220482885837555, -0.0169985368847847, -0.012776589021086693, -0.008554642088711262, -0.004332695156335831, -0.00011074915528297424, 0.004111198708415031, 0.008333146572113037, 0.012555092573165894, 0.01677703857421875, 0.020998986437916756, 0.02522093430161476, 0.029442880302667618, 0.033664826303720474, 0.03788677603006363, 0.042108722031116486, 0.04633066803216934, 0.0505526140332222, 0.054774560034275055, 0.05899650976061821, 0.06321845948696136, 0.06744040548801422, 0.07166235148906708, 0.07588429749011993, 0.08010624349117279, 0.08432818949222565, 0.0885501354932785, 0.09277208149433136, 0.09699402749538422, 0.10121597349643707, 0.10543792694807053, 0.10965987294912338, 0.11388181895017624, 0.1181037649512291, 0.12232571095228195, 0.1265476644039154, 0.13076961040496826, 0.13499155640602112, 0.13921350240707397, 0.14343544840812683, 0.1476573944091797]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 12.0, 16.0, 22.0, 23.0, 41.0, 25.0, 67.0, 81.0, 121.0, 132.0, 202.0, 313.0, 577.0, 1064.0, 2244.0, 5456.0, 16230.0, 51940.0, 166646.0, 378577.0, 281477.0, 96842.0, 29726.0, 9567.0, 3510.0, 1523.0, 773.0, 420.0, 296.0, 162.0, 115.0, 82.0, 54.0, 60.0, 32.0, 22.0, 20.0, 16.0, 16.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.0721435546875, -0.06994152069091797, -0.06773948669433594, -0.0655374526977539, -0.06333541870117188, -0.061133384704589844, -0.05893135070800781, -0.05672931671142578, -0.05452728271484375, -0.05232524871826172, -0.05012321472167969, -0.047921180725097656, -0.045719146728515625, -0.043517112731933594, -0.04131507873535156, -0.03911304473876953, -0.0369110107421875, -0.03470897674560547, -0.03250694274902344, -0.030304908752441406, -0.028102874755859375, -0.025900840759277344, -0.023698806762695312, -0.02149677276611328, -0.01929473876953125, -0.01709270477294922, -0.014890670776367188, -0.012688636779785156, -0.010486602783203125, -0.008284568786621094, -0.0060825347900390625, -0.0038805007934570312, -0.001678466796875, 0.0005235671997070312, 0.0027256011962890625, 0.004927635192871094, 0.007129669189453125, 0.009331703186035156, 0.011533737182617188, 0.013735771179199219, 0.01593780517578125, 0.01813983917236328, 0.020341873168945312, 0.022543907165527344, 0.024745941162109375, 0.026947975158691406, 0.029150009155273438, 0.03135204315185547, 0.0335540771484375, 0.03575611114501953, 0.03795814514160156, 0.040160179138183594, 0.042362213134765625, 0.044564247131347656, 0.04676628112792969, 0.04896831512451172, 0.05117034912109375, 0.05337238311767578, 0.05557441711425781, 0.057776451110839844, 0.059978485107421875, 0.062180519104003906, 0.06438255310058594, 0.06658458709716797, 0.06878662109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 21.0, 22.0, 38.0, 80.0, 108.0, 131.0, 143.0, 132.0, 102.0, 88.0, 63.0, 32.0, 21.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08795166015625, -0.08533668518066406, -0.08272171020507812, -0.08010673522949219, -0.07749176025390625, -0.07487678527832031, -0.07226181030273438, -0.06964683532714844, -0.0670318603515625, -0.06441688537597656, -0.061801910400390625, -0.05918693542480469, -0.05657196044921875, -0.05395698547363281, -0.051342010498046875, -0.04872703552246094, -0.046112060546875, -0.04349708557128906, -0.040882110595703125, -0.03826713562011719, -0.03565216064453125, -0.03303718566894531, -0.030422210693359375, -0.027807235717773438, -0.0251922607421875, -0.022577285766601562, -0.019962310791015625, -0.017347335815429688, -0.01473236083984375, -0.012117385864257812, -0.009502410888671875, -0.0068874359130859375, -0.0042724609375, -0.0016574859619140625, 0.000957489013671875, 0.0035724639892578125, 0.00618743896484375, 0.008802413940429688, 0.011417388916015625, 0.014032363891601562, 0.0166473388671875, 0.019262313842773438, 0.021877288818359375, 0.024492263793945312, 0.02710723876953125, 0.029722213745117188, 0.032337188720703125, 0.03495216369628906, 0.037567138671875, 0.04018211364746094, 0.042797088623046875, 0.04541206359863281, 0.04802703857421875, 0.05064201354980469, 0.053256988525390625, 0.05587196350097656, 0.0584869384765625, 0.06110191345214844, 0.06371688842773438, 0.06633186340332031, 0.06894683837890625, 0.07156181335449219, 0.07417678833007812, 0.07679176330566406, 0.07940673828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 13.0, 9.0, 20.0, 39.0, 49.0, 97.0, 133.0, 243.0, 377.0, 697.0, 1332.0, 2756.0, 6374.0, 16960.0, 49544.0, 154855.0, 385020.0, 285471.0, 94482.0, 30598.0, 10772.0, 4322.0, 2039.0, 974.0, 564.0, 310.0, 183.0, 124.0, 71.0, 40.0, 27.0, 17.0, 8.0, 12.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06884765625, -0.06686830520629883, -0.06488895416259766, -0.06290960311889648, -0.06093025207519531, -0.05895090103149414, -0.05697154998779297, -0.0549921989440918, -0.053012847900390625, -0.05103349685668945, -0.04905414581298828, -0.04707479476928711, -0.04509544372558594, -0.043116092681884766, -0.041136741638183594, -0.03915739059448242, -0.03717803955078125, -0.03519868850708008, -0.033219337463378906, -0.031239986419677734, -0.029260635375976562, -0.02728128433227539, -0.02530193328857422, -0.023322582244873047, -0.021343231201171875, -0.019363880157470703, -0.01738452911376953, -0.01540517807006836, -0.013425827026367188, -0.011446475982666016, -0.009467124938964844, -0.007487773895263672, -0.0055084228515625, -0.003529071807861328, -0.0015497207641601562, 0.0004296302795410156, 0.0024089813232421875, 0.004388332366943359, 0.006367683410644531, 0.008347034454345703, 0.010326385498046875, 0.012305736541748047, 0.014285087585449219, 0.01626443862915039, 0.018243789672851562, 0.020223140716552734, 0.022202491760253906, 0.024181842803955078, 0.02616119384765625, 0.028140544891357422, 0.030119895935058594, 0.032099246978759766, 0.03407859802246094, 0.03605794906616211, 0.03803730010986328, 0.04001665115356445, 0.041996002197265625, 0.0439753532409668, 0.04595470428466797, 0.04793405532836914, 0.04991340637207031, 0.051892757415771484, 0.053872108459472656, 0.05585145950317383, 0.057830810546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 9.0, 6.0, 7.0, 12.0, 9.0, 10.0, 23.0, 18.0, 17.0, 28.0, 34.0, 35.0, 32.0, 53.0, 38.0, 49.0, 45.0, 39.0, 41.0, 40.0, 46.0, 39.0, 32.0, 30.0, 23.0, 42.0, 31.0, 29.0, 26.0, 25.0, 30.0, 14.0, 14.0, 11.0, 13.0, 7.0, 8.0, 10.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0628662109375, -0.060699462890625, -0.05853271484375, -0.056365966796875, -0.05419921875, -0.052032470703125, -0.04986572265625, -0.047698974609375, -0.0455322265625, -0.043365478515625, -0.04119873046875, -0.039031982421875, -0.036865234375, -0.034698486328125, -0.03253173828125, -0.030364990234375, -0.0281982421875, -0.026031494140625, -0.02386474609375, -0.021697998046875, -0.01953125, -0.017364501953125, -0.01519775390625, -0.013031005859375, -0.0108642578125, -0.008697509765625, -0.00653076171875, -0.004364013671875, -0.002197265625, -3.0517578125e-05, 0.00213623046875, 0.004302978515625, 0.0064697265625, 0.008636474609375, 0.01080322265625, 0.012969970703125, 0.01513671875, 0.017303466796875, 0.01947021484375, 0.021636962890625, 0.0238037109375, 0.025970458984375, 0.02813720703125, 0.030303955078125, 0.032470703125, 0.034637451171875, 0.03680419921875, 0.038970947265625, 0.0411376953125, 0.043304443359375, 0.04547119140625, 0.047637939453125, 0.0498046875, 0.051971435546875, 0.05413818359375, 0.056304931640625, 0.0584716796875, 0.060638427734375, 0.06280517578125, 0.064971923828125, 0.067138671875, 0.069305419921875, 0.07147216796875, 0.073638916015625, 0.0758056640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 16.0, 22.0, 22.0, 25.0, 47.0, 61.0, 110.0, 165.0, 328.0, 653.0, 1485.0, 3553.0, 9136.0, 22612.0, 55400.0, 125343.0, 249099.0, 287417.0, 165295.0, 74944.0, 31467.0, 12518.0, 4871.0, 2067.0, 880.0, 411.0, 207.0, 119.0, 70.0, 50.0, 33.0, 28.0, 22.0, 15.0, 12.0, 11.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01496124267578125, -0.014481425285339355, -0.014001607894897461, -0.013521790504455566, -0.013041973114013672, -0.012562155723571777, -0.012082338333129883, -0.011602520942687988, -0.011122703552246094, -0.0106428861618042, -0.010163068771362305, -0.00968325138092041, -0.009203433990478516, -0.008723616600036621, -0.008243799209594727, -0.007763981819152832, -0.0072841644287109375, -0.006804347038269043, -0.0063245296478271484, -0.005844712257385254, -0.005364894866943359, -0.004885077476501465, -0.00440526008605957, -0.003925442695617676, -0.0034456253051757812, -0.0029658079147338867, -0.002485990524291992, -0.0020061731338500977, -0.0015263557434082031, -0.0010465383529663086, -0.0005667209625244141, -8.690357208251953e-05, 0.000392913818359375, 0.0008727312088012695, 0.001352548599243164, 0.0018323659896850586, 0.002312183380126953, 0.0027920007705688477, 0.003271818161010742, 0.0037516355514526367, 0.004231452941894531, 0.004711270332336426, 0.00519108772277832, 0.005670905113220215, 0.006150722503662109, 0.006630539894104004, 0.0071103572845458984, 0.007590174674987793, 0.008069992065429688, 0.008549809455871582, 0.009029626846313477, 0.009509444236755371, 0.009989261627197266, 0.01046907901763916, 0.010948896408081055, 0.01142871379852295, 0.011908531188964844, 0.012388348579406738, 0.012868165969848633, 0.013347983360290527, 0.013827800750732422, 0.014307618141174316, 0.014787435531616211, 0.015267252922058105, 0.0157470703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 6.0, 2.0, 7.0, 9.0, 8.0, 11.0, 17.0, 25.0, 21.0, 31.0, 45.0, 44.0, 72.0, 74.0, 64.0, 85.0, 87.0, 52.0, 63.0, 59.0, 59.0, 31.0, 26.0, 29.0, 28.0, 13.0, 9.0, 8.0, 10.0, 3.0, 3.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.285045623779297e-06, -8.005648851394653e-06, -7.72625207901001e-06, -7.446855306625366e-06, -7.167458534240723e-06, -6.888061761856079e-06, -6.6086649894714355e-06, -6.329268217086792e-06, -6.0498714447021484e-06, -5.770474672317505e-06, -5.491077899932861e-06, -5.211681127548218e-06, -4.932284355163574e-06, -4.652887582778931e-06, -4.373490810394287e-06, -4.0940940380096436e-06, -3.814697265625e-06, -3.5353004932403564e-06, -3.255903720855713e-06, -2.9765069484710693e-06, -2.6971101760864258e-06, -2.4177134037017822e-06, -2.1383166313171387e-06, -1.8589198589324951e-06, -1.5795230865478516e-06, -1.300126314163208e-06, -1.0207295417785645e-06, -7.413327693939209e-07, -4.6193599700927734e-07, -1.825392246246338e-07, 9.685754776000977e-08, 3.762543201446533e-07, 6.556510925292969e-07, 9.350478649139404e-07, 1.214444637298584e-06, 1.4938414096832275e-06, 1.773238182067871e-06, 2.0526349544525146e-06, 2.332031726837158e-06, 2.6114284992218018e-06, 2.8908252716064453e-06, 3.170222043991089e-06, 3.4496188163757324e-06, 3.729015588760376e-06, 4.0084123611450195e-06, 4.287809133529663e-06, 4.567205905914307e-06, 4.84660267829895e-06, 5.125999450683594e-06, 5.405396223068237e-06, 5.684792995452881e-06, 5.964189767837524e-06, 6.243586540222168e-06, 6.5229833126068115e-06, 6.802380084991455e-06, 7.081776857376099e-06, 7.361173629760742e-06, 7.640570402145386e-06, 7.91996717453003e-06, 8.199363946914673e-06, 8.478760719299316e-06, 8.75815749168396e-06, 9.037554264068604e-06, 9.316951036453247e-06, 9.59634780883789e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 10.0, 9.0, 9.0, 24.0, 21.0, 40.0, 62.0, 90.0, 162.0, 282.0, 476.0, 966.0, 1993.0, 4292.0, 10168.0, 24494.0, 58792.0, 132145.0, 241738.0, 267816.0, 168636.0, 78584.0, 33078.0, 13793.0, 5779.0, 2482.0, 1209.0, 577.0, 318.0, 178.0, 126.0, 68.0, 37.0, 34.0, 21.0, 17.0, 8.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157623291015625, -0.015256643295288086, -0.014750957489013672, -0.014245271682739258, -0.013739585876464844, -0.01323390007019043, -0.012728214263916016, -0.012222528457641602, -0.011716842651367188, -0.011211156845092773, -0.01070547103881836, -0.010199785232543945, -0.009694099426269531, -0.009188413619995117, -0.008682727813720703, -0.008177042007446289, -0.007671356201171875, -0.007165670394897461, -0.006659984588623047, -0.006154298782348633, -0.005648612976074219, -0.005142927169799805, -0.004637241363525391, -0.0041315555572509766, -0.0036258697509765625, -0.0031201839447021484, -0.0026144981384277344, -0.0021088123321533203, -0.0016031265258789062, -0.0010974407196044922, -0.0005917549133300781, -8.606910705566406e-05, 0.00041961669921875, 0.0009253025054931641, 0.0014309883117675781, 0.0019366741180419922, 0.0024423599243164062, 0.0029480457305908203, 0.0034537315368652344, 0.0039594173431396484, 0.0044651031494140625, 0.0049707889556884766, 0.005476474761962891, 0.005982160568237305, 0.006487846374511719, 0.006993532180786133, 0.007499217987060547, 0.008004903793334961, 0.008510589599609375, 0.009016275405883789, 0.009521961212158203, 0.010027647018432617, 0.010533332824707031, 0.011039018630981445, 0.01154470443725586, 0.012050390243530273, 0.012556076049804688, 0.013061761856079102, 0.013567447662353516, 0.01407313346862793, 0.014578819274902344, 0.015084505081176758, 0.015590190887451172, 0.016095876693725586, 0.0166015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 9.0, 9.0, 8.0, 9.0, 9.0, 14.0, 14.0, 19.0, 25.0, 32.0, 23.0, 39.0, 46.0, 51.0, 44.0, 49.0, 38.0, 59.0, 53.0, 62.0, 55.0, 53.0, 45.0, 38.0, 44.0, 32.0, 26.0, 15.0, 16.0, 14.0, 10.0, 9.0, 11.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.012176513671875, -0.011721372604370117, -0.011266231536865234, -0.010811090469360352, -0.010355949401855469, -0.009900808334350586, -0.009445667266845703, -0.00899052619934082, -0.008535385131835938, -0.008080244064331055, -0.007625102996826172, -0.007169961929321289, -0.006714820861816406, -0.0062596797943115234, -0.005804538726806641, -0.005349397659301758, -0.004894256591796875, -0.004439115524291992, -0.003983974456787109, -0.0035288333892822266, -0.0030736923217773438, -0.002618551254272461, -0.002163410186767578, -0.0017082691192626953, -0.0012531280517578125, -0.0007979869842529297, -0.0003428459167480469, 0.00011229515075683594, 0.0005674362182617188, 0.0010225772857666016, 0.0014777183532714844, 0.0019328594207763672, 0.00238800048828125, 0.002843141555786133, 0.0032982826232910156, 0.0037534236907958984, 0.004208564758300781, 0.004663705825805664, 0.005118846893310547, 0.00557398796081543, 0.0060291290283203125, 0.006484270095825195, 0.006939411163330078, 0.007394552230834961, 0.007849693298339844, 0.008304834365844727, 0.00875997543334961, 0.009215116500854492, 0.009670257568359375, 0.010125398635864258, 0.01058053970336914, 0.011035680770874023, 0.011490821838378906, 0.011945962905883789, 0.012401103973388672, 0.012856245040893555, 0.013311386108398438, 0.01376652717590332, 0.014221668243408203, 0.014676809310913086, 0.015131950378417969, 0.015587091445922852, 0.016042232513427734, 0.016497373580932617, 0.0169525146484375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 11.0, 22.0, 54.0, 111.0, 170.0, 195.0, 179.0, 117.0, 73.0, 30.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5217850208282471, -0.509054958820343, -0.4963248670101166, -0.4835948050022125, -0.4708647131919861, -0.45813465118408203, -0.445404589176178, -0.43267449736595154, -0.4199444353580475, -0.40721437335014343, -0.394484281539917, -0.38175421953201294, -0.3690241277217865, -0.35629406571388245, -0.343563973903656, -0.33083391189575195, -0.3181038498878479, -0.30537378787994385, -0.2926436960697174, -0.27991363406181335, -0.2671835422515869, -0.25445348024368286, -0.24172340333461761, -0.22899332642555237, -0.21626323461532593, -0.20353315770626068, -0.19080308079719543, -0.17807301878929138, -0.16534294188022614, -0.1526128649711609, -0.13988278806209564, -0.1271527111530304, -0.11442264914512634, -0.1016925722360611, -0.08896250277757645, -0.0762324258685112, -0.06350235641002655, -0.050772279500961304, -0.03804220259189606, -0.025312133133411407, -0.012582056224346161, 0.00014801789075136185, 0.012878092005848885, 0.025608167052268982, 0.03833824023604393, 0.05106831341981888, 0.06379839032888412, 0.07652845978736877, 0.08925853669643402, 0.10198861360549927, 0.11471868306398392, 0.12744876742362976, 0.1401788294315338, 0.15290890634059906, 0.1656389832496643, 0.17836904525756836, 0.1910991370677948, 0.20382921397686005, 0.2165592908859253, 0.22928935289382935, 0.2420194298028946, 0.25474950671195984, 0.2674795985221863, 0.28020966053009033, 0.2929397225379944]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 8.0, 9.0, 12.0, 11.0, 11.0, 13.0, 18.0, 21.0, 27.0, 20.0, 27.0, 35.0, 34.0, 31.0, 36.0, 26.0, 37.0, 38.0, 34.0, 43.0, 37.0, 37.0, 32.0, 40.0, 40.0, 35.0, 38.0, 30.0, 31.0, 25.0, 29.0, 22.0, 10.0, 24.0, 15.0, 8.0, 13.0, 6.0, 6.0, 3.0, 3.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.16210085153579712, -0.1570567488670349, -0.1520126461982727, -0.1469685435295105, -0.1419244408607483, -0.13688033819198608, -0.13183623552322388, -0.12679213285446167, -0.12174802273511887, -0.11670392006635666, -0.11165981739759445, -0.10661571472883224, -0.10157160460948944, -0.09652750194072723, -0.09148339927196503, -0.08643929660320282, -0.08139519393444061, -0.0763510912656784, -0.0713069885969162, -0.06626288592815399, -0.061218779534101486, -0.05617467686533928, -0.051130570471286774, -0.04608646780252457, -0.04104236513376236, -0.03599826246500015, -0.030954157933592796, -0.02591005340218544, -0.020865950733423233, -0.015821848064661026, -0.01077774353325367, -0.0057336390018463135, -0.0006895363330841064, 0.004354567267000675, 0.009398670867085457, 0.014442774467170238, 0.01948687806725502, 0.024530980736017227, 0.029575085267424583, 0.03461918979883194, 0.03966329246759415, 0.044707395136356354, 0.04975149780511856, 0.054795604199171066, 0.05983970686793327, 0.06488381326198578, 0.06992791593074799, 0.07497201859951019, 0.0800161212682724, 0.0850602239370346, 0.09010432660579681, 0.09514842927455902, 0.10019253194332123, 0.10523663461208344, 0.11028074473142624, 0.11532484740018845, 0.12036895006895065, 0.12541306018829346, 0.13045716285705566, 0.13550126552581787, 0.14054536819458008, 0.14558947086334229, 0.1506335735321045, 0.1556776762008667, 0.1607217788696289]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 9.0, 12.0, 17.0, 14.0, 34.0, 50.0, 81.0, 153.0, 253.0, 598.0, 1599.0, 5862.0, 24405.0, 204218.0, 2425098.0, 1411697.0, 99275.0, 14193.0, 4186.0, 1537.0, 510.0, 200.0, 103.0, 49.0, 34.0, 29.0, 13.0, 11.0, 12.0, 2.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08258056640625, -0.08006668090820312, -0.07755279541015625, -0.07503890991210938, -0.0725250244140625, -0.07001113891601562, -0.06749725341796875, -0.06498336791992188, -0.062469482421875, -0.059955596923828125, -0.05744171142578125, -0.054927825927734375, -0.0524139404296875, -0.049900054931640625, -0.04738616943359375, -0.044872283935546875, -0.0423583984375, -0.039844512939453125, -0.03733062744140625, -0.034816741943359375, -0.0323028564453125, -0.029788970947265625, -0.02727508544921875, -0.024761199951171875, -0.022247314453125, -0.019733428955078125, -0.01721954345703125, -0.014705657958984375, -0.0121917724609375, -0.009677886962890625, -0.00716400146484375, -0.004650115966796875, -0.00213623046875, 0.000377655029296875, 0.00289154052734375, 0.005405426025390625, 0.0079193115234375, 0.010433197021484375, 0.01294708251953125, 0.015460968017578125, 0.017974853515625, 0.020488739013671875, 0.02300262451171875, 0.025516510009765625, 0.0280303955078125, 0.030544281005859375, 0.03305816650390625, 0.035572052001953125, 0.0380859375, 0.040599822998046875, 0.04311370849609375, 0.045627593994140625, 0.0481414794921875, 0.050655364990234375, 0.05316925048828125, 0.055683135986328125, 0.058197021484375, 0.060710906982421875, 0.06322479248046875, 0.06573867797851562, 0.0682525634765625, 0.07076644897460938, 0.07328033447265625, 0.07579421997070312, 0.07830810546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 15.0, 36.0, 56.0, 89.0, 104.0, 117.0, 137.0, 143.0, 106.0, 73.0, 65.0, 36.0, 12.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0975341796875, -0.09486007690429688, -0.09218597412109375, -0.08951187133789062, -0.0868377685546875, -0.08416366577148438, -0.08148956298828125, -0.07881546020507812, -0.076141357421875, -0.07346725463867188, -0.07079315185546875, -0.06811904907226562, -0.0654449462890625, -0.06277084350585938, -0.06009674072265625, -0.057422637939453125, -0.05474853515625, -0.052074432373046875, -0.04940032958984375, -0.046726226806640625, -0.0440521240234375, -0.041378021240234375, -0.03870391845703125, -0.036029815673828125, -0.033355712890625, -0.030681610107421875, -0.02800750732421875, -0.025333404541015625, -0.0226593017578125, -0.019985198974609375, -0.01731109619140625, -0.014636993408203125, -0.011962890625, -0.009288787841796875, -0.00661468505859375, -0.003940582275390625, -0.0012664794921875, 0.001407623291015625, 0.00408172607421875, 0.006755828857421875, 0.009429931640625, 0.012104034423828125, 0.01477813720703125, 0.017452239990234375, 0.0201263427734375, 0.022800445556640625, 0.02547454833984375, 0.028148651123046875, 0.03082275390625, 0.033496856689453125, 0.03617095947265625, 0.038845062255859375, 0.0415191650390625, 0.044193267822265625, 0.04686737060546875, 0.049541473388671875, 0.052215576171875, 0.054889678955078125, 0.05756378173828125, 0.060237884521484375, 0.0629119873046875, 0.06558609008789062, 0.06826019287109375, 0.07093429565429688, 0.0736083984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 13.0, 16.0, 25.0, 35.0, 52.0, 74.0, 89.0, 124.0, 201.0, 449.0, 1074.0, 3799.0, 23412.0, 249159.0, 3226751.0, 634470.0, 45203.0, 6462.0, 1528.0, 573.0, 270.0, 151.0, 89.0, 68.0, 35.0, 45.0, 22.0, 15.0, 16.0, 10.0, 4.0, 7.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09747314453125, -0.09448814392089844, -0.09150314331054688, -0.08851814270019531, -0.08553314208984375, -0.08254814147949219, -0.07956314086914062, -0.07657814025878906, -0.0735931396484375, -0.07060813903808594, -0.06762313842773438, -0.06463813781738281, -0.06165313720703125, -0.05866813659667969, -0.055683135986328125, -0.05269813537597656, -0.049713134765625, -0.04672813415527344, -0.043743133544921875, -0.04075813293457031, -0.03777313232421875, -0.03478813171386719, -0.031803131103515625, -0.028818130493164062, -0.0258331298828125, -0.022848129272460938, -0.019863128662109375, -0.016878128051757812, -0.01389312744140625, -0.010908126831054688, -0.007923126220703125, -0.0049381256103515625, -0.001953125, 0.0010318756103515625, 0.004016876220703125, 0.0070018768310546875, 0.00998687744140625, 0.012971878051757812, 0.015956878662109375, 0.018941879272460938, 0.0219268798828125, 0.024911880493164062, 0.027896881103515625, 0.030881881713867188, 0.03386688232421875, 0.03685188293457031, 0.039836883544921875, 0.04282188415527344, 0.045806884765625, 0.04879188537597656, 0.051776885986328125, 0.05476188659667969, 0.05774688720703125, 0.06073188781738281, 0.06371688842773438, 0.06670188903808594, 0.0696868896484375, 0.07267189025878906, 0.07565689086914062, 0.07864189147949219, 0.08162689208984375, 0.08461189270019531, 0.08759689331054688, 0.09058189392089844, 0.09356689453125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 4.0, 6.0, 13.0, 14.0, 14.0, 31.0, 44.0, 71.0, 82.0, 129.0, 166.0, 271.0, 421.0, 550.0, 591.0, 490.0, 340.0, 275.0, 182.0, 111.0, 62.0, 64.0, 48.0, 34.0, 13.0, 16.0, 7.0, 10.0, 2.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.072509765625, -0.07066917419433594, -0.06882858276367188, -0.06698799133300781, -0.06514739990234375, -0.06330680847167969, -0.061466217041015625, -0.05962562561035156, -0.0577850341796875, -0.05594444274902344, -0.054103851318359375, -0.05226325988769531, -0.05042266845703125, -0.04858207702636719, -0.046741485595703125, -0.04490089416503906, -0.043060302734375, -0.04121971130371094, -0.039379119873046875, -0.03753852844238281, -0.03569793701171875, -0.03385734558105469, -0.032016754150390625, -0.030176162719726562, -0.0283355712890625, -0.026494979858398438, -0.024654388427734375, -0.022813796997070312, -0.02097320556640625, -0.019132614135742188, -0.017292022705078125, -0.015451431274414062, -0.01361083984375, -0.011770248413085938, -0.009929656982421875, -0.008089065551757812, -0.00624847412109375, -0.0044078826904296875, -0.002567291259765625, -0.0007266998291015625, 0.0011138916015625, 0.0029544830322265625, 0.004795074462890625, 0.0066356658935546875, 0.00847625732421875, 0.010316848754882812, 0.012157440185546875, 0.013998031616210938, 0.015838623046875, 0.017679214477539062, 0.019519805908203125, 0.021360397338867188, 0.02320098876953125, 0.025041580200195312, 0.026882171630859375, 0.028722763061523438, 0.0305633544921875, 0.03240394592285156, 0.034244537353515625, 0.03608512878417969, 0.03792572021484375, 0.03976631164550781, 0.041606903076171875, 0.04344749450683594, 0.0452880859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 9.0, 12.0, 24.0, 46.0, 108.0, 143.0, 187.0, 173.0, 127.0, 79.0, 52.0, 22.0, 9.0, 2.0, 7.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.43141767382621765, -0.41530224680900574, -0.39918678998947144, -0.3830713629722595, -0.3669559359550476, -0.3508405089378357, -0.3347250819206238, -0.3186096251010895, -0.30249419808387756, -0.28637877106666565, -0.27026331424713135, -0.25414788722991943, -0.23803246021270752, -0.2219170331954956, -0.2058015912771225, -0.1896861493587494, -0.17357072234153748, -0.15745529532432556, -0.14133985340595245, -0.12522441148757935, -0.10910898447036743, -0.09299355000257492, -0.07687811553478241, -0.0607626810669899, -0.04464724659919739, -0.028531812131404877, -0.012416377663612366, 0.0036990568041801453, 0.019814491271972656, 0.03592992573976517, 0.05204536020755768, 0.06816079467535019, 0.08427619934082031, 0.10039163380861282, 0.11650706827640533, 0.13262251019477844, 0.14873793721199036, 0.16485336422920227, 0.18096880614757538, 0.1970842480659485, 0.2131996750831604, 0.22931510210037231, 0.24543054401874542, 0.26154598593711853, 0.27766141295433044, 0.29377683997154236, 0.30989229679107666, 0.3260077238082886, 0.3421231508255005, 0.3582385778427124, 0.3743540048599243, 0.3904694616794586, 0.40658488869667053, 0.42270031571388245, 0.43881577253341675, 0.45493119955062866, 0.4710466265678406, 0.4871620535850525, 0.5032774806022644, 0.5193929076194763, 0.535508394241333, 0.5516238212585449, 0.5677392482757568, 0.5838546752929688, 0.5999701023101807]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 5.0, 9.0, 12.0, 6.0, 13.0, 18.0, 20.0, 19.0, 28.0, 26.0, 31.0, 24.0, 37.0, 22.0, 38.0, 45.0, 36.0, 39.0, 28.0, 36.0, 42.0, 39.0, 39.0, 31.0, 34.0, 36.0, 26.0, 30.0, 31.0, 19.0, 27.0, 28.0, 18.0, 18.0, 17.0, 11.0, 10.0, 10.0, 7.0, 7.0, 4.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12657690048217773, -0.12231141328811646, -0.11804593354463577, -0.11378045380115509, -0.10951496660709381, -0.10524947941303253, -0.10098399966955185, -0.09671851992607117, -0.09245303273200989, -0.08818754553794861, -0.08392206579446793, -0.07965658605098724, -0.07539109885692596, -0.07112561166286469, -0.066860131919384, -0.06259465217590332, -0.05832916498184204, -0.05406368151307106, -0.04979819804430008, -0.0455327145755291, -0.04126723110675812, -0.03700174763798714, -0.032736264169216156, -0.028470780700445175, -0.024205297231674194, -0.019939813762903214, -0.015674330294132233, -0.011408846825361252, -0.007143363356590271, -0.00287787988781929, 0.0013876035809516907, 0.0056530870497226715, 0.009918570518493652, 0.014184053987264633, 0.018449537456035614, 0.022715020924806595, 0.026980504393577576, 0.031245987862348557, 0.03551147133111954, 0.03977695479989052, 0.0440424382686615, 0.04830792173743248, 0.05257340520620346, 0.05683888867497444, 0.06110437214374542, 0.0653698593378067, 0.06963533908128738, 0.07390081882476807, 0.07816630601882935, 0.08243179321289062, 0.08669727295637131, 0.09096275269985199, 0.09522823989391327, 0.09949372708797455, 0.10375920683145523, 0.10802468657493591, 0.11229017376899719, 0.11655566096305847, 0.12082114070653915, 0.12508662045001984, 0.12935210764408112, 0.1336175948381424, 0.13788306713104248, 0.14214855432510376, 0.14641404151916504]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 10.0, 11.0, 15.0, 12.0, 22.0, 55.0, 63.0, 91.0, 110.0, 195.0, 269.0, 504.0, 941.0, 2139.0, 5384.0, 14347.0, 45575.0, 155854.0, 398491.0, 291895.0, 89623.0, 26838.0, 9202.0, 3586.0, 1500.0, 709.0, 354.0, 231.0, 160.0, 114.0, 93.0, 54.0, 26.0, 16.0, 22.0, 12.0, 11.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07843017578125, -0.0758819580078125, -0.073333740234375, -0.0707855224609375, -0.0682373046875, -0.0656890869140625, -0.063140869140625, -0.0605926513671875, -0.05804443359375, -0.0554962158203125, -0.052947998046875, -0.0503997802734375, -0.0478515625, -0.0453033447265625, -0.042755126953125, -0.0402069091796875, -0.03765869140625, -0.0351104736328125, -0.032562255859375, -0.0300140380859375, -0.0274658203125, -0.0249176025390625, -0.022369384765625, -0.0198211669921875, -0.01727294921875, -0.0147247314453125, -0.012176513671875, -0.0096282958984375, -0.007080078125, -0.0045318603515625, -0.001983642578125, 0.0005645751953125, 0.00311279296875, 0.0056610107421875, 0.008209228515625, 0.0107574462890625, 0.0133056640625, 0.0158538818359375, 0.018402099609375, 0.0209503173828125, 0.02349853515625, 0.0260467529296875, 0.028594970703125, 0.0311431884765625, 0.03369140625, 0.0362396240234375, 0.038787841796875, 0.0413360595703125, 0.04388427734375, 0.0464324951171875, 0.048980712890625, 0.0515289306640625, 0.0540771484375, 0.0566253662109375, 0.059173583984375, 0.0617218017578125, 0.06427001953125, 0.0668182373046875, 0.069366455078125, 0.0719146728515625, 0.074462890625, 0.0770111083984375, 0.079559326171875, 0.0821075439453125, 0.08465576171875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 8.0, 8.0, 30.0, 41.0, 50.0, 73.0, 102.0, 116.0, 116.0, 136.0, 106.0, 67.0, 60.0, 35.0, 26.0, 21.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.090576171875, -0.08809566497802734, -0.08561515808105469, -0.08313465118408203, -0.08065414428710938, -0.07817363739013672, -0.07569313049316406, -0.0732126235961914, -0.07073211669921875, -0.0682516098022461, -0.06577110290527344, -0.06329059600830078, -0.060810089111328125, -0.05832958221435547, -0.05584907531738281, -0.053368568420410156, -0.0508880615234375, -0.048407554626464844, -0.04592704772949219, -0.04344654083251953, -0.040966033935546875, -0.03848552703857422, -0.03600502014160156, -0.033524513244628906, -0.03104400634765625, -0.028563499450683594, -0.026082992553710938, -0.02360248565673828, -0.021121978759765625, -0.01864147186279297, -0.016160964965820312, -0.013680458068847656, -0.011199951171875, -0.008719444274902344, -0.0062389373779296875, -0.0037584304809570312, -0.001277923583984375, 0.0012025833129882812, 0.0036830902099609375, 0.006163597106933594, 0.00864410400390625, 0.011124610900878906, 0.013605117797851562, 0.01608562469482422, 0.018566131591796875, 0.02104663848876953, 0.023527145385742188, 0.026007652282714844, 0.0284881591796875, 0.030968666076660156, 0.03344917297363281, 0.03592967987060547, 0.038410186767578125, 0.04089069366455078, 0.04337120056152344, 0.045851707458496094, 0.04833221435546875, 0.050812721252441406, 0.05329322814941406, 0.05577373504638672, 0.058254241943359375, 0.06073474884033203, 0.06321525573730469, 0.06569576263427734, 0.06817626953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 10.0, 9.0, 19.0, 25.0, 33.0, 64.0, 99.0, 178.0, 314.0, 624.0, 1570.0, 4350.0, 14334.0, 55264.0, 249911.0, 502400.0, 165724.0, 37812.0, 10175.0, 3244.0, 1234.0, 539.0, 249.0, 154.0, 89.0, 41.0, 40.0, 13.0, 16.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07550525665283203, -0.07264137268066406, -0.0697774887084961, -0.06691360473632812, -0.06404972076416016, -0.06118583679199219, -0.05832195281982422, -0.05545806884765625, -0.05259418487548828, -0.04973030090332031, -0.046866416931152344, -0.044002532958984375, -0.041138648986816406, -0.03827476501464844, -0.03541088104248047, -0.0325469970703125, -0.02968311309814453, -0.026819229125976562, -0.023955345153808594, -0.021091461181640625, -0.018227577209472656, -0.015363693237304688, -0.012499809265136719, -0.00963592529296875, -0.006772041320800781, -0.0039081573486328125, -0.0010442733764648438, 0.001819610595703125, 0.004683494567871094, 0.0075473785400390625, 0.010411262512207031, 0.013275146484375, 0.01613903045654297, 0.019002914428710938, 0.021866798400878906, 0.024730682373046875, 0.027594566345214844, 0.030458450317382812, 0.03332233428955078, 0.03618621826171875, 0.03905010223388672, 0.04191398620605469, 0.044777870178222656, 0.047641754150390625, 0.050505638122558594, 0.05336952209472656, 0.05623340606689453, 0.0590972900390625, 0.06196117401123047, 0.06482505798339844, 0.0676889419555664, 0.07055282592773438, 0.07341670989990234, 0.07628059387207031, 0.07914447784423828, 0.08200836181640625, 0.08487224578857422, 0.08773612976074219, 0.09060001373291016, 0.09346389770507812, 0.0963277816772461, 0.09919166564941406, 0.10205554962158203, 0.10491943359375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 11.0, 9.0, 10.0, 20.0, 18.0, 14.0, 28.0, 23.0, 32.0, 31.0, 27.0, 42.0, 53.0, 41.0, 44.0, 42.0, 49.0, 47.0, 32.0, 41.0, 41.0, 40.0, 46.0, 31.0, 25.0, 22.0, 26.0, 23.0, 16.0, 20.0, 15.0, 7.0, 12.0, 14.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07342529296875, -0.0708150863647461, -0.06820487976074219, -0.06559467315673828, -0.06298446655273438, -0.06037425994873047, -0.05776405334472656, -0.055153846740722656, -0.05254364013671875, -0.049933433532714844, -0.04732322692871094, -0.04471302032470703, -0.042102813720703125, -0.03949260711669922, -0.03688240051269531, -0.034272193908691406, -0.0316619873046875, -0.029051780700683594, -0.026441574096679688, -0.02383136749267578, -0.021221160888671875, -0.01861095428466797, -0.016000747680664062, -0.013390541076660156, -0.01078033447265625, -0.008170127868652344, -0.0055599212646484375, -0.0029497146606445312, -0.000339508056640625, 0.0022706985473632812, 0.0048809051513671875, 0.007491111755371094, 0.010101318359375, 0.012711524963378906, 0.015321731567382812, 0.01793193817138672, 0.020542144775390625, 0.02315235137939453, 0.025762557983398438, 0.028372764587402344, 0.03098297119140625, 0.033593177795410156, 0.03620338439941406, 0.03881359100341797, 0.041423797607421875, 0.04403400421142578, 0.04664421081542969, 0.049254417419433594, 0.0518646240234375, 0.054474830627441406, 0.05708503723144531, 0.05969524383544922, 0.062305450439453125, 0.06491565704345703, 0.06752586364746094, 0.07013607025146484, 0.07274627685546875, 0.07535648345947266, 0.07796669006347656, 0.08057689666748047, 0.08318710327148438, 0.08579730987548828, 0.08840751647949219, 0.0910177230834961, 0.0936279296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 9.0, 14.0, 17.0, 18.0, 42.0, 52.0, 51.0, 78.0, 116.0, 182.0, 287.0, 379.0, 652.0, 1096.0, 1820.0, 3169.0, 5355.0, 9492.0, 17592.0, 34141.0, 70181.0, 163784.0, 319102.0, 229501.0, 95356.0, 44460.0, 22831.0, 12244.0, 6850.0, 3842.0, 2257.0, 1299.0, 794.0, 486.0, 317.0, 206.0, 139.0, 103.0, 64.0, 53.0, 39.0, 20.0, 14.0, 13.0, 14.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.01806640625, -0.017530202865600586, -0.016993999481201172, -0.016457796096801758, -0.015921592712402344, -0.01538538932800293, -0.014849185943603516, -0.014312982559204102, -0.013776779174804688, -0.013240575790405273, -0.01270437240600586, -0.012168169021606445, -0.011631965637207031, -0.011095762252807617, -0.010559558868408203, -0.010023355484008789, -0.009487152099609375, -0.008950948715209961, -0.008414745330810547, -0.007878541946411133, -0.007342338562011719, -0.006806135177612305, -0.006269931793212891, -0.0057337284088134766, -0.0051975250244140625, -0.0046613216400146484, -0.004125118255615234, -0.0035889148712158203, -0.0030527114868164062, -0.002516508102416992, -0.001980304718017578, -0.001444101333618164, -0.00090789794921875, -0.00037169456481933594, 0.00016450881958007812, 0.0007007122039794922, 0.0012369155883789062, 0.0017731189727783203, 0.0023093223571777344, 0.0028455257415771484, 0.0033817291259765625, 0.0039179325103759766, 0.004454135894775391, 0.004990339279174805, 0.005526542663574219, 0.006062746047973633, 0.006598949432373047, 0.007135152816772461, 0.007671356201171875, 0.008207559585571289, 0.008743762969970703, 0.009279966354370117, 0.009816169738769531, 0.010352373123168945, 0.01088857650756836, 0.011424779891967773, 0.011960983276367188, 0.012497186660766602, 0.013033390045166016, 0.01356959342956543, 0.014105796813964844, 0.014642000198364258, 0.015178203582763672, 0.015714406967163086, 0.0162506103515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 5.0, 5.0, 3.0, 12.0, 12.0, 13.0, 42.0, 42.0, 49.0, 95.0, 117.0, 127.0, 91.0, 92.0, 91.0, 46.0, 41.0, 27.0, 11.0, 16.0, 12.0, 4.0, 3.0, 1.0, 2.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1362135410308838e-05, -1.0922551155090332e-05, -1.0482966899871826e-05, -1.004338264465332e-05, -9.603798389434814e-06, -9.164214134216309e-06, -8.724629878997803e-06, -8.285045623779297e-06, -7.845461368560791e-06, -7.405877113342285e-06, -6.966292858123779e-06, -6.5267086029052734e-06, -6.087124347686768e-06, -5.647540092468262e-06, -5.207955837249756e-06, -4.76837158203125e-06, -4.328787326812744e-06, -3.889203071594238e-06, -3.4496188163757324e-06, -3.0100345611572266e-06, -2.5704503059387207e-06, -2.130866050720215e-06, -1.691281795501709e-06, -1.2516975402832031e-06, -8.121132850646973e-07, -3.725290298461914e-07, 6.705522537231445e-08, 5.066394805908203e-07, 9.462237358093262e-07, 1.385807991027832e-06, 1.8253922462463379e-06, 2.2649765014648438e-06, 2.7045607566833496e-06, 3.1441450119018555e-06, 3.5837292671203613e-06, 4.023313522338867e-06, 4.462897777557373e-06, 4.902482032775879e-06, 5.342066287994385e-06, 5.781650543212891e-06, 6.2212347984313965e-06, 6.660819053649902e-06, 7.100403308868408e-06, 7.539987564086914e-06, 7.97957181930542e-06, 8.419156074523926e-06, 8.858740329742432e-06, 9.298324584960938e-06, 9.737908840179443e-06, 1.017749309539795e-05, 1.0617077350616455e-05, 1.1056661605834961e-05, 1.1496245861053467e-05, 1.1935830116271973e-05, 1.2375414371490479e-05, 1.2814998626708984e-05, 1.325458288192749e-05, 1.3694167137145996e-05, 1.4133751392364502e-05, 1.4573335647583008e-05, 1.5012919902801514e-05, 1.545250415802002e-05, 1.5892088413238525e-05, 1.633167266845703e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 7.0, 15.0, 18.0, 30.0, 44.0, 76.0, 98.0, 159.0, 256.0, 448.0, 806.0, 1534.0, 3428.0, 7766.0, 18789.0, 47001.0, 124971.0, 305617.0, 317410.0, 133834.0, 50543.0, 20026.0, 8238.0, 3724.0, 1649.0, 857.0, 450.0, 263.0, 162.0, 108.0, 74.0, 59.0, 29.0, 15.0, 10.0, 8.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01873779296875, -0.018044710159301758, -0.017351627349853516, -0.016658544540405273, -0.01596546173095703, -0.015272378921508789, -0.014579296112060547, -0.013886213302612305, -0.013193130493164062, -0.01250004768371582, -0.011806964874267578, -0.011113882064819336, -0.010420799255371094, -0.009727716445922852, -0.00903463363647461, -0.008341550827026367, -0.007648468017578125, -0.006955385208129883, -0.006262302398681641, -0.0055692195892333984, -0.004876136779785156, -0.004183053970336914, -0.003489971160888672, -0.0027968883514404297, -0.0021038055419921875, -0.0014107227325439453, -0.0007176399230957031, -2.4557113647460938e-05, 0.0006685256958007812, 0.0013616085052490234, 0.0020546913146972656, 0.002747774124145508, 0.00344085693359375, 0.004133939743041992, 0.004827022552490234, 0.0055201053619384766, 0.006213188171386719, 0.006906270980834961, 0.007599353790283203, 0.008292436599731445, 0.008985519409179688, 0.00967860221862793, 0.010371685028076172, 0.011064767837524414, 0.011757850646972656, 0.012450933456420898, 0.01314401626586914, 0.013837099075317383, 0.014530181884765625, 0.015223264694213867, 0.01591634750366211, 0.01660943031311035, 0.017302513122558594, 0.017995595932006836, 0.018688678741455078, 0.01938176155090332, 0.020074844360351562, 0.020767927169799805, 0.021461009979248047, 0.02215409278869629, 0.02284717559814453, 0.023540258407592773, 0.024233341217041016, 0.024926424026489258, 0.0256195068359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 3.0, 4.0, 3.0, 3.0, 5.0, 9.0, 7.0, 7.0, 15.0, 12.0, 13.0, 21.0, 19.0, 33.0, 36.0, 48.0, 56.0, 59.0, 76.0, 55.0, 70.0, 65.0, 64.0, 53.0, 50.0, 47.0, 26.0, 28.0, 23.0, 20.0, 14.0, 15.0, 10.0, 11.0, 11.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01904296875, -0.01841259002685547, -0.017782211303710938, -0.017151832580566406, -0.016521453857421875, -0.015891075134277344, -0.015260696411132812, -0.014630317687988281, -0.01399993896484375, -0.013369560241699219, -0.012739181518554688, -0.012108802795410156, -0.011478424072265625, -0.010848045349121094, -0.010217666625976562, -0.009587287902832031, -0.0089569091796875, -0.008326530456542969, -0.0076961517333984375, -0.007065773010253906, -0.006435394287109375, -0.005805015563964844, -0.0051746368408203125, -0.004544258117675781, -0.00391387939453125, -0.0032835006713867188, -0.0026531219482421875, -0.0020227432250976562, -0.001392364501953125, -0.0007619857788085938, -0.0001316070556640625, 0.0004987716674804688, 0.001129150390625, 0.0017595291137695312, 0.0023899078369140625, 0.0030202865600585938, 0.003650665283203125, 0.004281044006347656, 0.0049114227294921875, 0.005541801452636719, 0.00617218017578125, 0.006802558898925781, 0.0074329376220703125, 0.008063316345214844, 0.008693695068359375, 0.009324073791503906, 0.009954452514648438, 0.010584831237792969, 0.0112152099609375, 0.011845588684082031, 0.012475967407226562, 0.013106346130371094, 0.013736724853515625, 0.014367103576660156, 0.014997482299804688, 0.01562786102294922, 0.01625823974609375, 0.01688861846923828, 0.017518997192382812, 0.018149375915527344, 0.018779754638671875, 0.019410133361816406, 0.020040512084960938, 0.02067089080810547, 0.02130126953125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 15.0, 21.0, 67.0, 113.0, 252.0, 213.0, 183.0, 79.0, 39.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6898530125617981, -0.6707860827445984, -0.6517190933227539, -0.6326521635055542, -0.6135851740837097, -0.59451824426651, -0.5754512548446655, -0.5563843250274658, -0.5373173952102661, -0.5182504653930664, -0.4991834759712219, -0.48011651635169983, -0.46104955673217773, -0.441982626914978, -0.42291566729545593, -0.40384870767593384, -0.38478171825408936, -0.36571475863456726, -0.34664779901504517, -0.32758083939552307, -0.308513879776001, -0.28944694995880127, -0.2703799903392792, -0.2513130307197571, -0.23224607110023499, -0.2131791114807129, -0.1941121518611908, -0.1750452071428299, -0.1559782475233078, -0.1369112879037857, -0.11784433573484421, -0.09877738356590271, -0.07971048355102539, -0.060643527656793594, -0.0415765717625618, -0.022509615868330002, -0.0034426599740982056, 0.01562429964542389, 0.03469125181436539, 0.053758203983306885, 0.07282516360282898, 0.09189212322235107, 0.11095907539129257, 0.13002602756023407, 0.14909298717975616, 0.16815994679927826, 0.18722689151763916, 0.20629385113716125, 0.22536081075668335, 0.24442777037620544, 0.26349472999572754, 0.28256168961524963, 0.30162864923477173, 0.32069557905197144, 0.33976253867149353, 0.3588294982910156, 0.3778964579105377, 0.3969634175300598, 0.4160303771495819, 0.435097336769104, 0.4541642665863037, 0.4732312560081482, 0.4922981858253479, 0.5113651752471924, 0.5304321050643921]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 5.0, 12.0, 15.0, 14.0, 19.0, 30.0, 26.0, 27.0, 24.0, 26.0, 30.0, 42.0, 34.0, 27.0, 37.0, 40.0, 43.0, 40.0, 44.0, 46.0, 42.0, 37.0, 36.0, 26.0, 31.0, 19.0, 33.0, 21.0, 14.0, 26.0, 14.0, 21.0, 15.0, 4.0, 8.0, 12.0, 6.0, 4.0, 7.0, 6.0, 2.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17511945962905884, -0.16959434747695923, -0.1640692502260208, -0.1585441380739212, -0.1530190259218216, -0.14749392867088318, -0.14196881651878357, -0.13644370436668396, -0.13091859221458435, -0.12539348006248474, -0.11986837536096573, -0.11434327065944672, -0.1088181585073471, -0.1032930538058281, -0.09776794910430908, -0.09224283695220947, -0.08671773970127106, -0.08119263499975204, -0.07566752284765244, -0.07014241814613342, -0.06461730599403381, -0.0590922012925148, -0.05356709659099579, -0.04804198816418648, -0.04251687973737717, -0.036991771310567856, -0.031466662883758545, -0.025941558182239532, -0.02041644975543022, -0.01489134132862091, -0.009366236627101898, -0.0038411282002925873, 0.0016839802265167236, 0.00720908772200346, 0.012734195217490196, 0.018259301781654358, 0.02378441020846367, 0.02930951863527298, 0.03483462333679199, 0.0403597317636013, 0.045884840190410614, 0.051409948617219925, 0.056935057044029236, 0.06246016174554825, 0.06798526644706726, 0.07351037859916687, 0.07903548330068588, 0.0845605880022049, 0.0900857001543045, 0.09561080485582352, 0.10113591700792313, 0.10666102170944214, 0.11218613386154175, 0.11771123856306076, 0.12323634326457977, 0.12876145541667938, 0.1342865526676178, 0.1398116648197174, 0.14533676207065582, 0.15086187422275543, 0.15638698637485504, 0.16191208362579346, 0.16743719577789307, 0.17296230792999268, 0.17848742008209229]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 7.0, 7.0, 11.0, 15.0, 13.0, 26.0, 33.0, 66.0, 113.0, 201.0, 375.0, 932.0, 2980.0, 8666.0, 30005.0, 200298.0, 1525250.0, 2033348.0, 330343.0, 45204.0, 10122.0, 3619.0, 1627.0, 571.0, 186.0, 110.0, 48.0, 36.0, 19.0, 18.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.07940530776977539, -0.07720661163330078, -0.07500791549682617, -0.07280921936035156, -0.07061052322387695, -0.06841182708740234, -0.06621313095092773, -0.06401443481445312, -0.061815738677978516, -0.059617042541503906, -0.0574183464050293, -0.05521965026855469, -0.05302095413208008, -0.05082225799560547, -0.04862356185913086, -0.04642486572265625, -0.04422616958618164, -0.04202747344970703, -0.03982877731323242, -0.03763008117675781, -0.0354313850402832, -0.033232688903808594, -0.031033992767333984, -0.028835296630859375, -0.026636600494384766, -0.024437904357910156, -0.022239208221435547, -0.020040512084960938, -0.017841815948486328, -0.01564311981201172, -0.01344442367553711, -0.0112457275390625, -0.00904703140258789, -0.006848335266113281, -0.004649639129638672, -0.0024509429931640625, -0.0002522468566894531, 0.0019464492797851562, 0.004145145416259766, 0.006343841552734375, 0.008542537689208984, 0.010741233825683594, 0.012939929962158203, 0.015138626098632812, 0.017337322235107422, 0.01953601837158203, 0.02173471450805664, 0.02393341064453125, 0.02613210678100586, 0.02833080291748047, 0.030529499053955078, 0.03272819519042969, 0.0349268913269043, 0.037125587463378906, 0.039324283599853516, 0.041522979736328125, 0.043721675872802734, 0.045920372009277344, 0.04811906814575195, 0.05031776428222656, 0.05251646041870117, 0.05471515655517578, 0.05691385269165039, 0.059112548828125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 11.0, 24.0, 34.0, 67.0, 73.0, 106.0, 130.0, 116.0, 116.0, 110.0, 73.0, 53.0, 49.0, 20.0, 13.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09759521484375, -0.09492111206054688, -0.09224700927734375, -0.08957290649414062, -0.0868988037109375, -0.08422470092773438, -0.08155059814453125, -0.07887649536132812, -0.076202392578125, -0.07352828979492188, -0.07085418701171875, -0.06818008422851562, -0.0655059814453125, -0.06283187866210938, -0.06015777587890625, -0.057483673095703125, -0.0548095703125, -0.052135467529296875, -0.04946136474609375, -0.046787261962890625, -0.0441131591796875, -0.041439056396484375, -0.03876495361328125, -0.036090850830078125, -0.033416748046875, -0.030742645263671875, -0.02806854248046875, -0.025394439697265625, -0.0227203369140625, -0.020046234130859375, -0.01737213134765625, -0.014698028564453125, -0.01202392578125, -0.009349822998046875, -0.00667572021484375, -0.004001617431640625, -0.0013275146484375, 0.001346588134765625, 0.00402069091796875, 0.006694793701171875, 0.009368896484375, 0.012042999267578125, 0.01471710205078125, 0.017391204833984375, 0.0200653076171875, 0.022739410400390625, 0.02541351318359375, 0.028087615966796875, 0.03076171875, 0.033435821533203125, 0.03610992431640625, 0.038784027099609375, 0.0414581298828125, 0.044132232666015625, 0.04680633544921875, 0.049480438232421875, 0.052154541015625, 0.054828643798828125, 0.05750274658203125, 0.060176849365234375, 0.0628509521484375, 0.06552505493164062, 0.06819915771484375, 0.07087326049804688, 0.07354736328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 14.0, 18.0, 23.0, 26.0, 44.0, 35.0, 46.0, 76.0, 129.0, 351.0, 1500.0, 17378.0, 2487778.0, 1671169.0, 13639.0, 1289.0, 329.0, 139.0, 75.0, 52.0, 48.0, 26.0, 22.0, 15.0, 7.0, 12.0, 10.0, 8.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.19091796875, -0.184326171875, -0.177734375, -0.171142578125, -0.16455078125, -0.157958984375, -0.1513671875, -0.144775390625, -0.13818359375, -0.131591796875, -0.125, -0.118408203125, -0.11181640625, -0.105224609375, -0.0986328125, -0.092041015625, -0.08544921875, -0.078857421875, -0.072265625, -0.065673828125, -0.05908203125, -0.052490234375, -0.0458984375, -0.039306640625, -0.03271484375, -0.026123046875, -0.01953125, -0.012939453125, -0.00634765625, 0.000244140625, 0.0068359375, 0.013427734375, 0.02001953125, 0.026611328125, 0.033203125, 0.039794921875, 0.04638671875, 0.052978515625, 0.0595703125, 0.066162109375, 0.07275390625, 0.079345703125, 0.0859375, 0.092529296875, 0.09912109375, 0.105712890625, 0.1123046875, 0.118896484375, 0.12548828125, 0.132080078125, 0.138671875, 0.145263671875, 0.15185546875, 0.158447265625, 0.1650390625, 0.171630859375, 0.17822265625, 0.184814453125, 0.19140625, 0.197998046875, 0.20458984375, 0.211181640625, 0.2177734375, 0.224365234375, 0.23095703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 8.0, 12.0, 12.0, 12.0, 20.0, 40.0, 68.0, 93.0, 141.0, 233.0, 401.0, 534.0, 727.0, 603.0, 449.0, 256.0, 183.0, 98.0, 72.0, 44.0, 24.0, 13.0, 11.0, 10.0, 8.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.108154296875, -0.10561656951904297, -0.10307884216308594, -0.1005411148071289, -0.09800338745117188, -0.09546566009521484, -0.09292793273925781, -0.09039020538330078, -0.08785247802734375, -0.08531475067138672, -0.08277702331542969, -0.08023929595947266, -0.07770156860351562, -0.0751638412475586, -0.07262611389160156, -0.07008838653564453, -0.0675506591796875, -0.06501293182373047, -0.06247520446777344, -0.059937477111816406, -0.057399749755859375, -0.054862022399902344, -0.05232429504394531, -0.04978656768798828, -0.04724884033203125, -0.04471111297607422, -0.04217338562011719, -0.039635658264160156, -0.037097930908203125, -0.034560203552246094, -0.03202247619628906, -0.02948474884033203, -0.026947021484375, -0.02440929412841797, -0.021871566772460938, -0.019333839416503906, -0.016796112060546875, -0.014258384704589844, -0.011720657348632812, -0.009182929992675781, -0.00664520263671875, -0.004107475280761719, -0.0015697479248046875, 0.0009679794311523438, 0.003505706787109375, 0.006043434143066406, 0.008581161499023438, 0.011118888854980469, 0.0136566162109375, 0.01619434356689453, 0.018732070922851562, 0.021269798278808594, 0.023807525634765625, 0.026345252990722656, 0.028882980346679688, 0.03142070770263672, 0.03395843505859375, 0.03649616241455078, 0.03903388977050781, 0.041571617126464844, 0.044109344482421875, 0.046647071838378906, 0.04918479919433594, 0.05172252655029297, 0.05426025390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 14.0, 39.0, 121.0, 250.0, 270.0, 193.0, 75.0, 22.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1342246532440186, -1.103812575340271, -1.0734004974365234, -1.0429884195327759, -1.0125763416290283, -0.9821643233299255, -0.9517523050308228, -0.9213402271270752, -0.8909281492233276, -0.8605160713195801, -0.8301039934158325, -0.7996919751167297, -0.7692798972129822, -0.7388678193092346, -0.7084558010101318, -0.6780437231063843, -0.6476316452026367, -0.6172195672988892, -0.5868074893951416, -0.5563954710960388, -0.5259833931922913, -0.4955713152885437, -0.46515926718711853, -0.43474721908569336, -0.4043351411819458, -0.37392306327819824, -0.34351101517677307, -0.3130989670753479, -0.28268688917160034, -0.2522748112678528, -0.2218627631664276, -0.19145070016384125, -0.16103863716125488, -0.13062657415866852, -0.10021451115608215, -0.06980244815349579, -0.039390385150909424, -0.008978322148323059, 0.021433740854263306, 0.05184580385684967, 0.08225786685943604, 0.1126699298620224, 0.14308199286460876, 0.17349405586719513, 0.2039061188697815, 0.23431818187236786, 0.2647302448749542, 0.2951422929763794, 0.32555437088012695, 0.3559664487838745, 0.3863784968852997, 0.41679054498672485, 0.4472026228904724, 0.47761470079421997, 0.5080267190933228, 0.5384387969970703, 0.5688508749008179, 0.5992629528045654, 0.629675030708313, 0.6600870490074158, 0.6904991269111633, 0.7209112048149109, 0.7513232231140137, 0.7817353010177612, 0.8121473789215088]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 5.0, 7.0, 7.0, 8.0, 8.0, 11.0, 6.0, 11.0, 23.0, 27.0, 31.0, 21.0, 18.0, 28.0, 35.0, 46.0, 38.0, 38.0, 49.0, 32.0, 42.0, 40.0, 46.0, 44.0, 30.0, 40.0, 41.0, 46.0, 34.0, 38.0, 20.0, 21.0, 16.0, 14.0, 15.0, 12.0, 14.0, 4.0, 6.0, 6.0, 2.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.17921161651611328, -0.17352086305618286, -0.16783012449741364, -0.1621393859386444, -0.156448632478714, -0.15075787901878357, -0.14506714046001434, -0.13937640190124512, -0.1336856484413147, -0.12799489498138428, -0.12230415642261505, -0.11661341041326523, -0.1109226644039154, -0.10523191839456558, -0.09954117238521576, -0.09385042637586594, -0.08815968036651611, -0.08246893435716629, -0.07677818834781647, -0.07108744233846664, -0.06539669632911682, -0.059705950319767, -0.054015204310417175, -0.04832445830106735, -0.04263371229171753, -0.036942966282367706, -0.03125222027301788, -0.02556147426366806, -0.019870728254318237, -0.014179982244968414, -0.008489236235618591, -0.0027984902262687683, 0.0028922557830810547, 0.008583001792430878, 0.0142737478017807, 0.019964493811130524, 0.025655239820480347, 0.03134598582983017, 0.03703673183917999, 0.042727477848529816, 0.04841822385787964, 0.05410896986722946, 0.059799715876579285, 0.06549046188592911, 0.07118120789527893, 0.07687195390462875, 0.08256269991397858, 0.0882534459233284, 0.09394419193267822, 0.09963493794202805, 0.10532568395137787, 0.11101642996072769, 0.11670717597007751, 0.12239792197942734, 0.12808866798877716, 0.1337794065475464, 0.1394701600074768, 0.14516091346740723, 0.15085165202617645, 0.15654239058494568, 0.1622331440448761, 0.16792389750480652, 0.17361463606357574, 0.17930537462234497, 0.1849961280822754]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 13.0, 16.0, 29.0, 41.0, 80.0, 140.0, 219.0, 419.0, 827.0, 1648.0, 4041.0, 11739.0, 43406.0, 201342.0, 488821.0, 226169.0, 48854.0, 12673.0, 4367.0, 1836.0, 858.0, 445.0, 241.0, 114.0, 68.0, 52.0, 35.0, 15.0, 4.0, 12.0, 13.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.07864093780517578, -0.07567787170410156, -0.07271480560302734, -0.06975173950195312, -0.0667886734008789, -0.06382560729980469, -0.06086254119873047, -0.05789947509765625, -0.05493640899658203, -0.05197334289550781, -0.049010276794433594, -0.046047210693359375, -0.043084144592285156, -0.04012107849121094, -0.03715801239013672, -0.0341949462890625, -0.03123188018798828, -0.028268814086914062, -0.025305747985839844, -0.022342681884765625, -0.019379615783691406, -0.016416549682617188, -0.013453483581542969, -0.01049041748046875, -0.007527351379394531, -0.0045642852783203125, -0.0016012191772460938, 0.001361846923828125, 0.004324913024902344, 0.0072879791259765625, 0.010251045227050781, 0.013214111328125, 0.01617717742919922, 0.019140243530273438, 0.022103309631347656, 0.025066375732421875, 0.028029441833496094, 0.030992507934570312, 0.03395557403564453, 0.03691864013671875, 0.03988170623779297, 0.04284477233886719, 0.045807838439941406, 0.048770904541015625, 0.051733970642089844, 0.05469703674316406, 0.05766010284423828, 0.0606231689453125, 0.06358623504638672, 0.06654930114746094, 0.06951236724853516, 0.07247543334960938, 0.0754384994506836, 0.07840156555175781, 0.08136463165283203, 0.08432769775390625, 0.08729076385498047, 0.09025382995605469, 0.0932168960571289, 0.09617996215820312, 0.09914302825927734, 0.10210609436035156, 0.10506916046142578, 0.1080322265625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 15.0, 13.0, 38.0, 40.0, 76.0, 77.0, 99.0, 127.0, 117.0, 89.0, 95.0, 85.0, 54.0, 32.0, 24.0, 9.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10540771484375, -0.1025705337524414, -0.09973335266113281, -0.09689617156982422, -0.09405899047851562, -0.09122180938720703, -0.08838462829589844, -0.08554744720458984, -0.08271026611328125, -0.07987308502197266, -0.07703590393066406, -0.07419872283935547, -0.07136154174804688, -0.06852436065673828, -0.06568717956542969, -0.0628499984741211, -0.0600128173828125, -0.057175636291503906, -0.05433845520019531, -0.05150127410888672, -0.048664093017578125, -0.04582691192626953, -0.04298973083496094, -0.040152549743652344, -0.03731536865234375, -0.034478187561035156, -0.03164100646972656, -0.02880382537841797, -0.025966644287109375, -0.02312946319580078, -0.020292282104492188, -0.017455101013183594, -0.014617919921875, -0.011780738830566406, -0.008943557739257812, -0.006106376647949219, -0.003269195556640625, -0.00043201446533203125, 0.0024051666259765625, 0.005242347717285156, 0.00807952880859375, 0.010916709899902344, 0.013753890991210938, 0.01659107208251953, 0.019428253173828125, 0.02226543426513672, 0.025102615356445312, 0.027939796447753906, 0.0307769775390625, 0.033614158630371094, 0.03645133972167969, 0.03928852081298828, 0.042125701904296875, 0.04496288299560547, 0.04780006408691406, 0.050637245178222656, 0.05347442626953125, 0.056311607360839844, 0.05914878845214844, 0.06198596954345703, 0.06482315063476562, 0.06766033172607422, 0.07049751281738281, 0.0733346939086914, 0.076171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 10.0, 23.0, 18.0, 33.0, 40.0, 55.0, 94.0, 90.0, 169.0, 305.0, 502.0, 1010.0, 1923.0, 3922.0, 8255.0, 19052.0, 52272.0, 165177.0, 371303.0, 275282.0, 93447.0, 31522.0, 12417.0, 5764.0, 2672.0, 1388.0, 720.0, 431.0, 218.0, 122.0, 81.0, 64.0, 37.0, 20.0, 29.0, 23.0, 18.0, 10.0, 6.0, 4.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06304931640625, -0.06106376647949219, -0.059078216552734375, -0.05709266662597656, -0.05510711669921875, -0.05312156677246094, -0.051136016845703125, -0.04915046691894531, -0.0471649169921875, -0.04517936706542969, -0.043193817138671875, -0.04120826721191406, -0.03922271728515625, -0.03723716735839844, -0.035251617431640625, -0.03326606750488281, -0.031280517578125, -0.029294967651367188, -0.027309417724609375, -0.025323867797851562, -0.02333831787109375, -0.021352767944335938, -0.019367218017578125, -0.017381668090820312, -0.0153961181640625, -0.013410568237304688, -0.011425018310546875, -0.009439468383789062, -0.00745391845703125, -0.0054683685302734375, -0.003482818603515625, -0.0014972686767578125, 0.00048828125, 0.0024738311767578125, 0.004459381103515625, 0.0064449310302734375, 0.00843048095703125, 0.010416030883789062, 0.012401580810546875, 0.014387130737304688, 0.0163726806640625, 0.018358230590820312, 0.020343780517578125, 0.022329330444335938, 0.02431488037109375, 0.026300430297851562, 0.028285980224609375, 0.030271530151367188, 0.032257080078125, 0.03424263000488281, 0.036228179931640625, 0.03821372985839844, 0.04019927978515625, 0.04218482971191406, 0.044170379638671875, 0.04615592956542969, 0.0481414794921875, 0.05012702941894531, 0.052112579345703125, 0.05409812927246094, 0.05608367919921875, 0.05806922912597656, 0.060054779052734375, 0.06204032897949219, 0.06402587890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 7.0, 13.0, 11.0, 16.0, 13.0, 18.0, 20.0, 12.0, 22.0, 24.0, 31.0, 34.0, 42.0, 40.0, 39.0, 44.0, 42.0, 36.0, 56.0, 35.0, 46.0, 49.0, 33.0, 31.0, 35.0, 26.0, 39.0, 39.0, 25.0, 18.0, 17.0, 13.0, 13.0, 11.0, 8.0, 8.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.095703125, -0.09285736083984375, -0.0900115966796875, -0.08716583251953125, -0.084320068359375, -0.08147430419921875, -0.0786285400390625, -0.07578277587890625, -0.07293701171875, -0.07009124755859375, -0.0672454833984375, -0.06439971923828125, -0.061553955078125, -0.05870819091796875, -0.0558624267578125, -0.05301666259765625, -0.0501708984375, -0.04732513427734375, -0.0444793701171875, -0.04163360595703125, -0.038787841796875, -0.03594207763671875, -0.0330963134765625, -0.03025054931640625, -0.02740478515625, -0.02455902099609375, -0.0217132568359375, -0.01886749267578125, -0.016021728515625, -0.01317596435546875, -0.0103302001953125, -0.00748443603515625, -0.004638671875, -0.00179290771484375, 0.0010528564453125, 0.00389862060546875, 0.006744384765625, 0.00959014892578125, 0.0124359130859375, 0.01528167724609375, 0.01812744140625, 0.02097320556640625, 0.0238189697265625, 0.02666473388671875, 0.029510498046875, 0.03235626220703125, 0.0352020263671875, 0.03804779052734375, 0.0408935546875, 0.04373931884765625, 0.0465850830078125, 0.04943084716796875, 0.052276611328125, 0.05512237548828125, 0.0579681396484375, 0.06081390380859375, 0.06365966796875, 0.06650543212890625, 0.0693511962890625, 0.07219696044921875, 0.075042724609375, 0.07788848876953125, 0.0807342529296875, 0.08358001708984375, 0.08642578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 6.0, 6.0, 11.0, 16.0, 26.0, 46.0, 79.0, 144.0, 214.0, 430.0, 859.0, 1919.0, 4190.0, 10441.0, 28707.0, 93904.0, 309335.0, 391774.0, 140974.0, 40897.0, 14117.0, 5693.0, 2396.0, 1121.0, 555.0, 294.0, 150.0, 98.0, 56.0, 25.0, 28.0, 16.0, 4.0, 10.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0220947265625, -0.021385669708251953, -0.020676612854003906, -0.01996755599975586, -0.019258499145507812, -0.018549442291259766, -0.01784038543701172, -0.017131328582763672, -0.016422271728515625, -0.015713214874267578, -0.015004158020019531, -0.014295101165771484, -0.013586044311523438, -0.01287698745727539, -0.012167930603027344, -0.011458873748779297, -0.01074981689453125, -0.010040760040283203, -0.009331703186035156, -0.00862264633178711, -0.007913589477539062, -0.007204532623291016, -0.006495475769042969, -0.005786418914794922, -0.005077362060546875, -0.004368305206298828, -0.0036592483520507812, -0.0029501914978027344, -0.0022411346435546875, -0.0015320777893066406, -0.0008230209350585938, -0.00011396408081054688, 0.0005950927734375, 0.0013041496276855469, 0.0020132064819335938, 0.0027222633361816406, 0.0034313201904296875, 0.004140377044677734, 0.004849433898925781, 0.005558490753173828, 0.006267547607421875, 0.006976604461669922, 0.007685661315917969, 0.008394718170166016, 0.009103775024414062, 0.00981283187866211, 0.010521888732910156, 0.011230945587158203, 0.01194000244140625, 0.012649059295654297, 0.013358116149902344, 0.01406717300415039, 0.014776229858398438, 0.015485286712646484, 0.01619434356689453, 0.016903400421142578, 0.017612457275390625, 0.018321514129638672, 0.01903057098388672, 0.019739627838134766, 0.020448684692382812, 0.02115774154663086, 0.021866798400878906, 0.022575855255126953, 0.023284912109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 9.0, 4.0, 13.0, 28.0, 21.0, 36.0, 48.0, 54.0, 58.0, 80.0, 95.0, 79.0, 75.0, 88.0, 72.0, 50.0, 50.0, 28.0, 22.0, 29.0, 13.0, 12.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1622905731201172e-05, -1.130625605583191e-05, -1.0989606380462646e-05, -1.0672956705093384e-05, -1.0356307029724121e-05, -1.0039657354354858e-05, -9.723007678985596e-06, -9.406358003616333e-06, -9.08970832824707e-06, -8.773058652877808e-06, -8.456408977508545e-06, -8.139759302139282e-06, -7.82310962677002e-06, -7.506459951400757e-06, -7.189810276031494e-06, -6.8731606006622314e-06, -6.556510925292969e-06, -6.239861249923706e-06, -5.923211574554443e-06, -5.606561899185181e-06, -5.289912223815918e-06, -4.973262548446655e-06, -4.656612873077393e-06, -4.33996319770813e-06, -4.023313522338867e-06, -3.7066638469696045e-06, -3.390014171600342e-06, -3.073364496231079e-06, -2.7567148208618164e-06, -2.4400651454925537e-06, -2.123415470123291e-06, -1.8067657947540283e-06, -1.4901161193847656e-06, -1.173466444015503e-06, -8.568167686462402e-07, -5.401670932769775e-07, -2.2351741790771484e-07, 9.313225746154785e-08, 4.0978193283081055e-07, 7.264316082000732e-07, 1.043081283569336e-06, 1.3597309589385986e-06, 1.6763806343078613e-06, 1.993030309677124e-06, 2.3096799850463867e-06, 2.6263296604156494e-06, 2.942979335784912e-06, 3.259629011154175e-06, 3.5762786865234375e-06, 3.8929283618927e-06, 4.209578037261963e-06, 4.526227712631226e-06, 4.842877388000488e-06, 5.159527063369751e-06, 5.476176738739014e-06, 5.792826414108276e-06, 6.109476089477539e-06, 6.426125764846802e-06, 6.7427754402160645e-06, 7.059425115585327e-06, 7.37607479095459e-06, 7.692724466323853e-06, 8.009374141693115e-06, 8.326023817062378e-06, 8.64267349243164e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 8.0, 12.0, 18.0, 27.0, 34.0, 48.0, 64.0, 99.0, 151.0, 249.0, 391.0, 626.0, 971.0, 1648.0, 3119.0, 6188.0, 13455.0, 32098.0, 83215.0, 204149.0, 321335.0, 221929.0, 93345.0, 36122.0, 14653.0, 6614.0, 3225.0, 1879.0, 1041.0, 617.0, 405.0, 270.0, 176.0, 116.0, 69.0, 42.0, 39.0, 25.0, 20.0, 15.0, 9.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.020294189453125, -0.01970696449279785, -0.019119739532470703, -0.018532514572143555, -0.017945289611816406, -0.017358064651489258, -0.01677083969116211, -0.01618361473083496, -0.015596389770507812, -0.015009164810180664, -0.014421939849853516, -0.013834714889526367, -0.013247489929199219, -0.01266026496887207, -0.012073040008544922, -0.011485815048217773, -0.010898590087890625, -0.010311365127563477, -0.009724140167236328, -0.00913691520690918, -0.008549690246582031, -0.007962465286254883, -0.007375240325927734, -0.006788015365600586, -0.0062007904052734375, -0.005613565444946289, -0.005026340484619141, -0.004439115524291992, -0.0038518905639648438, -0.0032646656036376953, -0.002677440643310547, -0.0020902156829833984, -0.00150299072265625, -0.0009157657623291016, -0.0003285408020019531, 0.0002586841583251953, 0.0008459091186523438, 0.0014331340789794922, 0.0020203590393066406, 0.002607583999633789, 0.0031948089599609375, 0.003782033920288086, 0.004369258880615234, 0.004956483840942383, 0.005543708801269531, 0.00613093376159668, 0.006718158721923828, 0.0073053836822509766, 0.007892608642578125, 0.008479833602905273, 0.009067058563232422, 0.00965428352355957, 0.010241508483886719, 0.010828733444213867, 0.011415958404541016, 0.012003183364868164, 0.012590408325195312, 0.013177633285522461, 0.01376485824584961, 0.014352083206176758, 0.014939308166503906, 0.015526533126831055, 0.016113758087158203, 0.01670098304748535, 0.0172882080078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 8.0, 15.0, 15.0, 22.0, 24.0, 40.0, 58.0, 57.0, 66.0, 60.0, 80.0, 84.0, 68.0, 79.0, 58.0, 62.0, 39.0, 43.0, 21.0, 20.0, 20.0, 13.0, 10.0, 6.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0222320556640625, -0.02142810821533203, -0.020624160766601562, -0.019820213317871094, -0.019016265869140625, -0.018212318420410156, -0.017408370971679688, -0.01660442352294922, -0.01580047607421875, -0.014996528625488281, -0.014192581176757812, -0.013388633728027344, -0.012584686279296875, -0.011780738830566406, -0.010976791381835938, -0.010172843933105469, -0.009368896484375, -0.008564949035644531, -0.0077610015869140625, -0.006957054138183594, -0.006153106689453125, -0.005349159240722656, -0.0045452117919921875, -0.0037412643432617188, -0.00293731689453125, -0.0021333694458007812, -0.0013294219970703125, -0.0005254745483398438, 0.000278472900390625, 0.0010824203491210938, 0.0018863677978515625, 0.0026903152465820312, 0.0034942626953125, 0.004298210144042969, 0.0051021575927734375, 0.005906105041503906, 0.006710052490234375, 0.007513999938964844, 0.008317947387695312, 0.009121894836425781, 0.00992584228515625, 0.010729789733886719, 0.011533737182617188, 0.012337684631347656, 0.013141632080078125, 0.013945579528808594, 0.014749526977539062, 0.015553474426269531, 0.016357421875, 0.01716136932373047, 0.017965316772460938, 0.018769264221191406, 0.019573211669921875, 0.020377159118652344, 0.021181106567382812, 0.02198505401611328, 0.02278900146484375, 0.02359294891357422, 0.024396896362304688, 0.025200843811035156, 0.026004791259765625, 0.026808738708496094, 0.027612686157226562, 0.02841663360595703, 0.0292205810546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 14.0, 24.0, 74.0, 160.0, 241.0, 206.0, 138.0, 70.0, 30.0, 21.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5351487994194031, -0.5176911950111389, -0.5002336502075195, -0.48277607560157776, -0.465318500995636, -0.4478608965873718, -0.43040332198143005, -0.4129457473754883, -0.3954881727695465, -0.37803059816360474, -0.36057302355766296, -0.3431154489517212, -0.32565784454345703, -0.30820029973983765, -0.2907426953315735, -0.2732851207256317, -0.25582754611968994, -0.23836997151374817, -0.2209123969078064, -0.20345480740070343, -0.18599723279476166, -0.16853965818881989, -0.15108206868171692, -0.13362449407577515, -0.11616691946983337, -0.0987093448638916, -0.08125176280736923, -0.06379418075084686, -0.04633660614490509, -0.028879031538963318, -0.011421449482440948, 0.006036132574081421, 0.023493647575378418, 0.04095122590661049, 0.05840880423784256, 0.07586638629436493, 0.0933239609003067, 0.11078153550624847, 0.12823912501335144, 0.1456966996192932, 0.16315427422523499, 0.18061184883117676, 0.19806942343711853, 0.2155270129442215, 0.23298458755016327, 0.25044214725494385, 0.267899751663208, 0.2853573262691498, 0.30281490087509155, 0.3202724754810333, 0.3377300500869751, 0.35518762469291687, 0.37264519929885864, 0.3901028037071228, 0.4075603783130646, 0.42501795291900635, 0.4424755275249481, 0.4599331021308899, 0.47739067673683167, 0.49484825134277344, 0.5123058557510376, 0.529763400554657, 0.5472210049629211, 0.5646785497665405, 0.5821361541748047]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 0.0, 6.0, 5.0, 4.0, 5.0, 8.0, 9.0, 17.0, 15.0, 12.0, 23.0, 29.0, 34.0, 26.0, 33.0, 28.0, 44.0, 44.0, 43.0, 55.0, 49.0, 36.0, 46.0, 43.0, 34.0, 47.0, 32.0, 37.0, 26.0, 27.0, 33.0, 23.0, 28.0, 19.0, 16.0, 17.0, 12.0, 7.0, 5.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18936187028884888, -0.18273046612739563, -0.1760990470647812, -0.16946764290332794, -0.1628362387418747, -0.15620481967926025, -0.149573415517807, -0.14294201135635376, -0.1363106071949005, -0.12967920303344727, -0.12304779142141342, -0.11641637980937958, -0.10978497564792633, -0.10315356403589249, -0.09652215242385864, -0.0898907482624054, -0.08325932919979095, -0.07662791758775711, -0.06999651342630386, -0.06336510181427002, -0.056733693927526474, -0.05010228604078293, -0.043470874428749084, -0.03683946654200554, -0.030208058655261993, -0.023576650768518448, -0.016945241019129753, -0.010313831269741058, -0.003682423382997513, 0.0029489845037460327, 0.009580396115779877, 0.016211804002523422, 0.022843211889266968, 0.029474619776010513, 0.03610602766275406, 0.0427374392747879, 0.04936884716153145, 0.056000255048274994, 0.06263166666030884, 0.06926307082176208, 0.07589448243379593, 0.08252589404582977, 0.08915729820728302, 0.09578870981931686, 0.10242012143135071, 0.10905152559280396, 0.1156829372048378, 0.12231434881687164, 0.1289457529783249, 0.13557715713977814, 0.14220857620239258, 0.14883998036384583, 0.15547138452529907, 0.16210278868675232, 0.16873420774936676, 0.17536561191082, 0.18199703097343445, 0.1886284351348877, 0.19525985419750214, 0.20189125835895538, 0.20852266252040863, 0.21515408158302307, 0.22178548574447632, 0.22841688990592957, 0.2350482940673828]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 2.0, 7.0, 19.0, 24.0, 35.0, 59.0, 74.0, 117.0, 207.0, 389.0, 738.0, 1624.0, 3455.0, 7242.0, 16631.0, 50392.0, 210212.0, 859342.0, 1748526.0, 966408.0, 240051.0, 57188.0, 17256.0, 6922.0, 3437.0, 1940.0, 963.0, 431.0, 213.0, 124.0, 80.0, 53.0, 33.0, 21.0, 24.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05535888671875, -0.0537567138671875, -0.052154541015625, -0.0505523681640625, -0.0489501953125, -0.0473480224609375, -0.045745849609375, -0.0441436767578125, -0.04254150390625, -0.0409393310546875, -0.039337158203125, -0.0377349853515625, -0.0361328125, -0.0345306396484375, -0.032928466796875, -0.0313262939453125, -0.02972412109375, -0.0281219482421875, -0.026519775390625, -0.0249176025390625, -0.0233154296875, -0.0217132568359375, -0.020111083984375, -0.0185089111328125, -0.01690673828125, -0.0153045654296875, -0.013702392578125, -0.0121002197265625, -0.010498046875, -0.0088958740234375, -0.007293701171875, -0.0056915283203125, -0.00408935546875, -0.0024871826171875, -0.000885009765625, 0.0007171630859375, 0.0023193359375, 0.0039215087890625, 0.005523681640625, 0.0071258544921875, 0.00872802734375, 0.0103302001953125, 0.011932373046875, 0.0135345458984375, 0.01513671875, 0.0167388916015625, 0.018341064453125, 0.0199432373046875, 0.02154541015625, 0.0231475830078125, 0.024749755859375, 0.0263519287109375, 0.0279541015625, 0.0295562744140625, 0.031158447265625, 0.0327606201171875, 0.03436279296875, 0.0359649658203125, 0.037567138671875, 0.0391693115234375, 0.040771484375, 0.0423736572265625, 0.043975830078125, 0.0455780029296875, 0.04718017578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 12.0, 22.0, 28.0, 42.0, 64.0, 89.0, 120.0, 99.0, 116.0, 114.0, 92.0, 51.0, 59.0, 47.0, 22.0, 12.0, 4.0, 10.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09124755859375, -0.08865070343017578, -0.08605384826660156, -0.08345699310302734, -0.08086013793945312, -0.0782632827758789, -0.07566642761230469, -0.07306957244873047, -0.07047271728515625, -0.06787586212158203, -0.06527900695800781, -0.0626821517944336, -0.060085296630859375, -0.057488441467285156, -0.05489158630371094, -0.05229473114013672, -0.0496978759765625, -0.04710102081298828, -0.04450416564941406, -0.041907310485839844, -0.039310455322265625, -0.036713600158691406, -0.03411674499511719, -0.03151988983154297, -0.02892303466796875, -0.02632617950439453, -0.023729324340820312, -0.021132469177246094, -0.018535614013671875, -0.015938758850097656, -0.013341903686523438, -0.010745048522949219, -0.008148193359375, -0.005551338195800781, -0.0029544830322265625, -0.00035762786865234375, 0.002239227294921875, 0.004836082458496094, 0.0074329376220703125, 0.010029792785644531, 0.01262664794921875, 0.015223503112792969, 0.017820358276367188, 0.020417213439941406, 0.023014068603515625, 0.025610923767089844, 0.028207778930664062, 0.03080463409423828, 0.0334014892578125, 0.03599834442138672, 0.03859519958496094, 0.041192054748535156, 0.043788909912109375, 0.046385765075683594, 0.04898262023925781, 0.05157947540283203, 0.05417633056640625, 0.05677318572998047, 0.05937004089355469, 0.061966896057128906, 0.06456375122070312, 0.06716060638427734, 0.06975746154785156, 0.07235431671142578, 0.074951171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 4.0, 5.0, 11.0, 17.0, 15.0, 21.0, 21.0, 39.0, 43.0, 55.0, 74.0, 135.0, 288.0, 503.0, 1082.0, 3150.0, 11795.0, 74482.0, 1740795.0, 2253412.0, 89040.0, 13380.0, 3433.0, 1166.0, 528.0, 280.0, 160.0, 97.0, 60.0, 45.0, 36.0, 22.0, 23.0, 13.0, 9.0, 8.0, 5.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.115966796875, -0.1121063232421875, -0.108245849609375, -0.1043853759765625, -0.10052490234375, -0.0966644287109375, -0.092803955078125, -0.0889434814453125, -0.0850830078125, -0.0812225341796875, -0.077362060546875, -0.0735015869140625, -0.06964111328125, -0.0657806396484375, -0.061920166015625, -0.0580596923828125, -0.05419921875, -0.0503387451171875, -0.046478271484375, -0.0426177978515625, -0.03875732421875, -0.0348968505859375, -0.031036376953125, -0.0271759033203125, -0.0233154296875, -0.0194549560546875, -0.015594482421875, -0.0117340087890625, -0.00787353515625, -0.0040130615234375, -0.000152587890625, 0.0037078857421875, 0.007568359375, 0.0114288330078125, 0.015289306640625, 0.0191497802734375, 0.02301025390625, 0.0268707275390625, 0.030731201171875, 0.0345916748046875, 0.0384521484375, 0.0423126220703125, 0.046173095703125, 0.0500335693359375, 0.05389404296875, 0.0577545166015625, 0.061614990234375, 0.0654754638671875, 0.0693359375, 0.0731964111328125, 0.077056884765625, 0.0809173583984375, 0.08477783203125, 0.0886383056640625, 0.092498779296875, 0.0963592529296875, 0.1002197265625, 0.1040802001953125, 0.107940673828125, 0.1118011474609375, 0.11566162109375, 0.1195220947265625, 0.123382568359375, 0.1272430419921875, 0.131103515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 5.0, 26.0, 20.0, 30.0, 56.0, 75.0, 117.0, 146.0, 226.0, 355.0, 508.0, 645.0, 609.0, 435.0, 286.0, 144.0, 103.0, 83.0, 41.0, 34.0, 36.0, 18.0, 17.0, 11.0, 10.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.07464599609375, -0.07212638854980469, -0.06960678100585938, -0.06708717346191406, -0.06456756591796875, -0.06204795837402344, -0.059528350830078125, -0.05700874328613281, -0.0544891357421875, -0.05196952819824219, -0.049449920654296875, -0.04693031311035156, -0.04441070556640625, -0.04189109802246094, -0.039371490478515625, -0.03685188293457031, -0.034332275390625, -0.03181266784667969, -0.029293060302734375, -0.026773452758789062, -0.02425384521484375, -0.021734237670898438, -0.019214630126953125, -0.016695022583007812, -0.0141754150390625, -0.011655807495117188, -0.009136199951171875, -0.0066165924072265625, -0.00409698486328125, -0.0015773773193359375, 0.000942230224609375, 0.0034618377685546875, 0.0059814453125, 0.008501052856445312, 0.011020660400390625, 0.013540267944335938, 0.01605987548828125, 0.018579483032226562, 0.021099090576171875, 0.023618698120117188, 0.0261383056640625, 0.028657913208007812, 0.031177520751953125, 0.03369712829589844, 0.03621673583984375, 0.03873634338378906, 0.041255950927734375, 0.04377555847167969, 0.046295166015625, 0.04881477355957031, 0.051334381103515625, 0.05385398864746094, 0.05637359619140625, 0.05889320373535156, 0.061412811279296875, 0.06393241882324219, 0.0664520263671875, 0.06897163391113281, 0.07149124145507812, 0.07401084899902344, 0.07653045654296875, 0.07905006408691406, 0.08156967163085938, 0.08408927917480469, 0.08660888671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 13.0, 24.0, 54.0, 117.0, 199.0, 252.0, 179.0, 82.0, 34.0, 17.0, 12.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2369219064712524, -1.20773184299469, -1.1785417795181274, -1.1493515968322754, -1.120161533355713, -1.0909714698791504, -1.061781406402588, -1.0325913429260254, -1.003401279449463, -0.9742112159729004, -0.9450210928916931, -0.9158310294151306, -0.8866409659385681, -0.8574508428573608, -0.8282607793807983, -0.7990707159042358, -0.7698805928230286, -0.7406905293464661, -0.7115004062652588, -0.6823103427886963, -0.6531202793121338, -0.6239302158355713, -0.594740092754364, -0.5655500292778015, -0.5363599061965942, -0.5071698427200317, -0.47797974944114685, -0.44878965616226196, -0.41959959268569946, -0.3904094994068146, -0.3612194061279297, -0.3320293426513672, -0.3028392791748047, -0.2736491858959198, -0.2444591224193573, -0.2152690291404724, -0.18607895076274872, -0.15688887238502502, -0.12769877910614014, -0.09850870072841644, -0.06931862235069275, -0.04012854024767876, -0.010938458144664764, 0.018251627683639526, 0.04744170606136322, 0.07663178443908691, 0.1058218777179718, 0.1350119560956955, 0.1642020344734192, 0.19339211285114288, 0.22258219122886658, 0.25177228450775146, 0.28096234798431396, 0.31015244126319885, 0.33934253454208374, 0.36853259801864624, 0.39772269129753113, 0.426912784576416, 0.4561028480529785, 0.4852929413318634, 0.5144830346107483, 0.5436730980873108, 0.5728632211685181, 0.6020532846450806, 0.6312433481216431]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 5.0, 7.0, 17.0, 20.0, 17.0, 19.0, 23.0, 40.0, 39.0, 28.0, 32.0, 51.0, 52.0, 55.0, 46.0, 44.0, 51.0, 59.0, 40.0, 44.0, 39.0, 34.0, 41.0, 32.0, 27.0, 23.0, 21.0, 11.0, 21.0, 17.0, 14.0, 10.0, 4.0, 4.0, 3.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.3009309768676758, -0.2929282784461975, -0.28492555022239685, -0.2769228518009186, -0.2689201235771179, -0.26091742515563965, -0.2529147267341614, -0.24491199851036072, -0.23690930008888245, -0.22890658676624298, -0.22090387344360352, -0.21290117502212524, -0.20489846169948578, -0.1968957483768463, -0.18889303505420685, -0.18089032173156738, -0.17288760840892792, -0.16488489508628845, -0.156882181763649, -0.14887946844100952, -0.14087677001953125, -0.13287405669689178, -0.12487134337425232, -0.11686863005161285, -0.10886592417955399, -0.10086321085691452, -0.09286050498485565, -0.08485779166221619, -0.07685507833957672, -0.06885237246751785, -0.06084965914487839, -0.05284694954752922, -0.044844239950180054, -0.03684153035283089, -0.02883881889283657, -0.020836107432842255, -0.012833397835493088, -0.004830688238143921, 0.0031720250844955444, 0.011174734681844711, 0.019177444279193878, 0.027180153876543045, 0.03518286347389221, 0.04318557679653168, 0.051188286393880844, 0.05919099599123001, 0.06719370931386948, 0.07519641518592834, 0.08319912850856781, 0.09120184183120728, 0.09920454770326614, 0.10720726102590561, 0.11520996689796448, 0.12321268022060394, 0.1312153935432434, 0.13921810686588287, 0.14722082018852234, 0.1552235335111618, 0.16322624683380127, 0.17122894525527954, 0.179231658577919, 0.18723437190055847, 0.19523708522319794, 0.2032397985458374, 0.21124249696731567]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 5.0, 12.0, 22.0, 19.0, 14.0, 35.0, 35.0, 53.0, 84.0, 197.0, 483.0, 1688.0, 10102.0, 113646.0, 647331.0, 249344.0, 21352.0, 2811.0, 697.0, 270.0, 128.0, 60.0, 39.0, 32.0, 15.0, 25.0, 12.0, 13.0, 9.0, 10.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1649169921875, -0.1598682403564453, -0.15481948852539062, -0.14977073669433594, -0.14472198486328125, -0.13967323303222656, -0.13462448120117188, -0.1295757293701172, -0.1245269775390625, -0.11947822570800781, -0.11442947387695312, -0.10938072204589844, -0.10433197021484375, -0.09928321838378906, -0.09423446655273438, -0.08918571472167969, -0.084136962890625, -0.07908821105957031, -0.07403945922851562, -0.06899070739746094, -0.06394195556640625, -0.05889320373535156, -0.053844451904296875, -0.04879570007324219, -0.0437469482421875, -0.03869819641113281, -0.033649444580078125, -0.028600692749023438, -0.02355194091796875, -0.018503189086914062, -0.013454437255859375, -0.008405685424804688, -0.00335693359375, 0.0016918182373046875, 0.006740570068359375, 0.011789321899414062, 0.01683807373046875, 0.021886825561523438, 0.026935577392578125, 0.03198432922363281, 0.0370330810546875, 0.04208183288574219, 0.047130584716796875, 0.05217933654785156, 0.05722808837890625, 0.06227684020996094, 0.06732559204101562, 0.07237434387207031, 0.077423095703125, 0.08247184753417969, 0.08752059936523438, 0.09256935119628906, 0.09761810302734375, 0.10266685485839844, 0.10771560668945312, 0.11276435852050781, 0.1178131103515625, 0.12286186218261719, 0.12791061401367188, 0.13295936584472656, 0.13800811767578125, 0.14305686950683594, 0.14810562133789062, 0.1531543731689453, 0.158203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 14.0, 28.0, 24.0, 33.0, 45.0, 51.0, 63.0, 92.0, 99.0, 81.0, 80.0, 81.0, 65.0, 58.0, 55.0, 33.0, 28.0, 31.0, 16.0, 6.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09381103515625, -0.09125804901123047, -0.08870506286621094, -0.0861520767211914, -0.08359909057617188, -0.08104610443115234, -0.07849311828613281, -0.07594013214111328, -0.07338714599609375, -0.07083415985107422, -0.06828117370605469, -0.06572818756103516, -0.06317520141601562, -0.060622215270996094, -0.05806922912597656, -0.05551624298095703, -0.0529632568359375, -0.05041027069091797, -0.04785728454589844, -0.045304298400878906, -0.042751312255859375, -0.040198326110839844, -0.03764533996582031, -0.03509235382080078, -0.03253936767578125, -0.02998638153076172, -0.027433395385742188, -0.024880409240722656, -0.022327423095703125, -0.019774436950683594, -0.017221450805664062, -0.014668464660644531, -0.012115478515625, -0.009562492370605469, -0.0070095062255859375, -0.004456520080566406, -0.001903533935546875, 0.0006494522094726562, 0.0032024383544921875, 0.005755424499511719, 0.00830841064453125, 0.010861396789550781, 0.013414382934570312, 0.015967369079589844, 0.018520355224609375, 0.021073341369628906, 0.023626327514648438, 0.02617931365966797, 0.0287322998046875, 0.03128528594970703, 0.03383827209472656, 0.036391258239746094, 0.038944244384765625, 0.041497230529785156, 0.04405021667480469, 0.04660320281982422, 0.04915618896484375, 0.05170917510986328, 0.05426216125488281, 0.056815147399902344, 0.059368133544921875, 0.061921119689941406, 0.06447410583496094, 0.06702709197998047, 0.069580078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 10.0, 13.0, 21.0, 21.0, 26.0, 45.0, 77.0, 118.0, 212.0, 339.0, 565.0, 1125.0, 2145.0, 5032.0, 13199.0, 36837.0, 106619.0, 265437.0, 357819.0, 164853.0, 58904.0, 20598.0, 7855.0, 3243.0, 1464.0, 798.0, 419.0, 258.0, 162.0, 103.0, 65.0, 50.0, 36.0, 28.0, 15.0, 7.0, 6.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05660581588745117, -0.054526329040527344, -0.052446842193603516, -0.05036735534667969, -0.04828786849975586, -0.04620838165283203, -0.0441288948059082, -0.042049407958984375, -0.03996992111206055, -0.03789043426513672, -0.03581094741821289, -0.03373146057128906, -0.031651973724365234, -0.029572486877441406, -0.027493000030517578, -0.02541351318359375, -0.023334026336669922, -0.021254539489746094, -0.019175052642822266, -0.017095565795898438, -0.01501607894897461, -0.012936592102050781, -0.010857105255126953, -0.008777618408203125, -0.006698131561279297, -0.004618644714355469, -0.0025391578674316406, -0.0004596710205078125, 0.0016198158264160156, 0.0036993026733398438, 0.005778789520263672, 0.0078582763671875, 0.009937763214111328, 0.012017250061035156, 0.014096736907958984, 0.016176223754882812, 0.01825571060180664, 0.02033519744873047, 0.022414684295654297, 0.024494171142578125, 0.026573657989501953, 0.02865314483642578, 0.03073263168334961, 0.03281211853027344, 0.034891605377197266, 0.036971092224121094, 0.03905057907104492, 0.04113006591796875, 0.04320955276489258, 0.045289039611816406, 0.047368526458740234, 0.04944801330566406, 0.05152750015258789, 0.05360698699951172, 0.05568647384643555, 0.057765960693359375, 0.0598454475402832, 0.06192493438720703, 0.06400442123413086, 0.06608390808105469, 0.06816339492797852, 0.07024288177490234, 0.07232236862182617, 0.07440185546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 5.0, 10.0, 8.0, 8.0, 20.0, 15.0, 19.0, 26.0, 33.0, 26.0, 35.0, 38.0, 48.0, 45.0, 52.0, 50.0, 51.0, 48.0, 46.0, 46.0, 44.0, 46.0, 50.0, 30.0, 37.0, 26.0, 20.0, 25.0, 13.0, 10.0, 14.0, 12.0, 10.0, 7.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.110107421875, -0.10626220703125, -0.1024169921875, -0.09857177734375, -0.0947265625, -0.09088134765625, -0.0870361328125, -0.08319091796875, -0.079345703125, -0.07550048828125, -0.0716552734375, -0.06781005859375, -0.06396484375, -0.06011962890625, -0.0562744140625, -0.05242919921875, -0.048583984375, -0.04473876953125, -0.0408935546875, -0.03704833984375, -0.033203125, -0.02935791015625, -0.0255126953125, -0.02166748046875, -0.017822265625, -0.01397705078125, -0.0101318359375, -0.00628662109375, -0.00244140625, 0.00140380859375, 0.0052490234375, 0.00909423828125, 0.012939453125, 0.01678466796875, 0.0206298828125, 0.02447509765625, 0.0283203125, 0.03216552734375, 0.0360107421875, 0.03985595703125, 0.043701171875, 0.04754638671875, 0.0513916015625, 0.05523681640625, 0.05908203125, 0.06292724609375, 0.0667724609375, 0.07061767578125, 0.074462890625, 0.07830810546875, 0.0821533203125, 0.08599853515625, 0.08984375, 0.09368896484375, 0.0975341796875, 0.10137939453125, 0.105224609375, 0.10906982421875, 0.1129150390625, 0.11676025390625, 0.12060546875, 0.12445068359375, 0.1282958984375, 0.13214111328125, 0.135986328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 9.0, 18.0, 20.0, 39.0, 45.0, 91.0, 118.0, 175.0, 272.0, 433.0, 841.0, 1568.0, 3582.0, 9363.0, 28072.0, 94595.0, 303070.0, 405364.0, 138165.0, 40845.0, 12833.0, 4597.0, 2022.0, 991.0, 548.0, 294.0, 203.0, 119.0, 70.0, 58.0, 38.0, 24.0, 15.0, 10.0, 10.0, 6.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01788330078125, -0.017327070236206055, -0.01677083969116211, -0.016214609146118164, -0.01565837860107422, -0.015102148056030273, -0.014545917510986328, -0.013989686965942383, -0.013433456420898438, -0.012877225875854492, -0.012320995330810547, -0.011764764785766602, -0.011208534240722656, -0.010652303695678711, -0.010096073150634766, -0.00953984260559082, -0.008983612060546875, -0.00842738151550293, -0.007871150970458984, -0.007314920425415039, -0.006758689880371094, -0.0062024593353271484, -0.005646228790283203, -0.005089998245239258, -0.0045337677001953125, -0.003977537155151367, -0.003421306610107422, -0.0028650760650634766, -0.0023088455200195312, -0.001752614974975586, -0.0011963844299316406, -0.0006401538848876953, -8.392333984375e-05, 0.0004723072052001953, 0.0010285377502441406, 0.001584768295288086, 0.0021409988403320312, 0.0026972293853759766, 0.003253459930419922, 0.003809690475463867, 0.0043659210205078125, 0.004922151565551758, 0.005478382110595703, 0.0060346126556396484, 0.006590843200683594, 0.007147073745727539, 0.007703304290771484, 0.00825953483581543, 0.008815765380859375, 0.00937199592590332, 0.009928226470947266, 0.010484457015991211, 0.011040687561035156, 0.011596918106079102, 0.012153148651123047, 0.012709379196166992, 0.013265609741210938, 0.013821840286254883, 0.014378070831298828, 0.014934301376342773, 0.015490531921386719, 0.016046762466430664, 0.01660299301147461, 0.017159223556518555, 0.0177154541015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 7.0, 12.0, 8.0, 17.0, 20.0, 20.0, 32.0, 33.0, 31.0, 45.0, 53.0, 55.0, 70.0, 91.0, 67.0, 49.0, 57.0, 64.0, 51.0, 40.0, 32.0, 28.0, 25.0, 15.0, 17.0, 8.0, 6.0, 7.0, 0.0, 4.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-8.106231689453125e-06, -7.860362529754639e-06, -7.614493370056152e-06, -7.368624210357666e-06, -7.12275505065918e-06, -6.876885890960693e-06, -6.631016731262207e-06, -6.385147571563721e-06, -6.139278411865234e-06, -5.893409252166748e-06, -5.647540092468262e-06, -5.401670932769775e-06, -5.155801773071289e-06, -4.909932613372803e-06, -4.664063453674316e-06, -4.41819429397583e-06, -4.172325134277344e-06, -3.926455974578857e-06, -3.680586814880371e-06, -3.4347176551818848e-06, -3.1888484954833984e-06, -2.942979335784912e-06, -2.6971101760864258e-06, -2.4512410163879395e-06, -2.205371856689453e-06, -1.959502696990967e-06, -1.7136335372924805e-06, -1.4677643775939941e-06, -1.2218952178955078e-06, -9.760260581970215e-07, -7.301568984985352e-07, -4.842877388000488e-07, -2.384185791015625e-07, 7.450580596923828e-09, 2.5331974029541016e-07, 4.991888999938965e-07, 7.450580596923828e-07, 9.909272193908691e-07, 1.2367963790893555e-06, 1.4826655387878418e-06, 1.7285346984863281e-06, 1.9744038581848145e-06, 2.2202730178833008e-06, 2.466142177581787e-06, 2.7120113372802734e-06, 2.9578804969787598e-06, 3.203749656677246e-06, 3.4496188163757324e-06, 3.6954879760742188e-06, 3.941357135772705e-06, 4.187226295471191e-06, 4.433095455169678e-06, 4.678964614868164e-06, 4.92483377456665e-06, 5.170702934265137e-06, 5.416572093963623e-06, 5.662441253662109e-06, 5.908310413360596e-06, 6.154179573059082e-06, 6.400048732757568e-06, 6.645917892456055e-06, 6.891787052154541e-06, 7.137656211853027e-06, 7.383525371551514e-06, 7.62939453125e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 12.0, 9.0, 14.0, 18.0, 19.0, 51.0, 53.0, 61.0, 95.0, 164.0, 234.0, 349.0, 521.0, 865.0, 1388.0, 2544.0, 4936.0, 10937.0, 27556.0, 74824.0, 197016.0, 368370.0, 218037.0, 85216.0, 31073.0, 12063.0, 5278.0, 2679.0, 1526.0, 923.0, 554.0, 377.0, 234.0, 159.0, 109.0, 63.0, 66.0, 41.0, 31.0, 15.0, 11.0, 10.0, 7.0, 10.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.0178680419921875, -0.01733565330505371, -0.016803264617919922, -0.016270875930786133, -0.015738487243652344, -0.015206098556518555, -0.014673709869384766, -0.014141321182250977, -0.013608932495117188, -0.013076543807983398, -0.01254415512084961, -0.01201176643371582, -0.011479377746582031, -0.010946989059448242, -0.010414600372314453, -0.009882211685180664, -0.009349822998046875, -0.008817434310913086, -0.008285045623779297, -0.007752656936645508, -0.007220268249511719, -0.00668787956237793, -0.006155490875244141, -0.0056231021881103516, -0.0050907135009765625, -0.0045583248138427734, -0.004025936126708984, -0.0034935474395751953, -0.0029611587524414062, -0.002428770065307617, -0.0018963813781738281, -0.001363992691040039, -0.00083160400390625, -0.00029921531677246094, 0.00023317337036132812, 0.0007655620574951172, 0.0012979507446289062, 0.0018303394317626953, 0.0023627281188964844, 0.0028951168060302734, 0.0034275054931640625, 0.0039598941802978516, 0.004492282867431641, 0.00502467155456543, 0.005557060241699219, 0.006089448928833008, 0.006621837615966797, 0.007154226303100586, 0.007686614990234375, 0.008219003677368164, 0.008751392364501953, 0.009283781051635742, 0.009816169738769531, 0.01034855842590332, 0.01088094711303711, 0.011413335800170898, 0.011945724487304688, 0.012478113174438477, 0.013010501861572266, 0.013542890548706055, 0.014075279235839844, 0.014607667922973633, 0.015140056610107422, 0.01567244529724121, 0.016204833984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 9.0, 8.0, 8.0, 18.0, 14.0, 22.0, 36.0, 32.0, 60.0, 73.0, 68.0, 84.0, 90.0, 91.0, 80.0, 71.0, 40.0, 40.0, 39.0, 25.0, 18.0, 15.0, 12.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.024169921875, -0.02344655990600586, -0.02272319793701172, -0.021999835968017578, -0.021276473999023438, -0.020553112030029297, -0.019829750061035156, -0.019106388092041016, -0.018383026123046875, -0.017659664154052734, -0.016936302185058594, -0.016212940216064453, -0.015489578247070312, -0.014766216278076172, -0.014042854309082031, -0.01331949234008789, -0.01259613037109375, -0.01187276840209961, -0.011149406433105469, -0.010426044464111328, -0.009702682495117188, -0.008979320526123047, -0.008255958557128906, -0.007532596588134766, -0.006809234619140625, -0.006085872650146484, -0.005362510681152344, -0.004639148712158203, -0.0039157867431640625, -0.003192424774169922, -0.0024690628051757812, -0.0017457008361816406, -0.0010223388671875, -0.0002989768981933594, 0.00042438507080078125, 0.0011477470397949219, 0.0018711090087890625, 0.002594470977783203, 0.0033178329467773438, 0.004041194915771484, 0.004764556884765625, 0.005487918853759766, 0.006211280822753906, 0.006934642791748047, 0.0076580047607421875, 0.008381366729736328, 0.009104728698730469, 0.00982809066772461, 0.01055145263671875, 0.01127481460571289, 0.011998176574707031, 0.012721538543701172, 0.013444900512695312, 0.014168262481689453, 0.014891624450683594, 0.015614986419677734, 0.016338348388671875, 0.017061710357666016, 0.017785072326660156, 0.018508434295654297, 0.019231796264648438, 0.019955158233642578, 0.02067852020263672, 0.02140188217163086, 0.022125244140625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 12.0, 32.0, 105.0, 163.0, 262.0, 213.0, 104.0, 59.0, 18.0, 20.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2807014584541321, -0.2583438456058502, -0.23598623275756836, -0.2136286050081253, -0.19127099215984344, -0.16891337931156158, -0.14655575156211853, -0.12419813871383667, -0.10184052586555481, -0.07948291301727295, -0.05712529271841049, -0.034767672419548035, -0.012410059571266174, 0.009947553277015686, 0.03230518102645874, 0.0546627938747406, 0.07702040672302246, 0.09937801957130432, 0.12173563987016678, 0.14409326016902924, 0.1664508730173111, 0.18880848586559296, 0.211166113615036, 0.23352372646331787, 0.25588133931159973, 0.2782389521598816, 0.30059656500816345, 0.3229541778564453, 0.34531182050704956, 0.36766940355300903, 0.3900270462036133, 0.41238465905189514, 0.4347423315048218, 0.45709994435310364, 0.4794575572013855, 0.5018151998519897, 0.5241727828979492, 0.5465304255485535, 0.5688880681991577, 0.5912456512451172, 0.6136032342910767, 0.6359608769416809, 0.6583184599876404, 0.6806761026382446, 0.7030336856842041, 0.7253913283348083, 0.7477489709854126, 0.7701065540313721, 0.7924641966819763, 0.8148218393325806, 0.83717942237854, 0.8595370650291443, 0.8818946480751038, 0.904252290725708, 0.9266098737716675, 0.9489675164222717, 0.971325159072876, 0.9936828017234802, 1.0160404443740845, 1.038398027420044, 1.0607556104660034, 1.083113193511963, 1.105470895767212, 1.1278284788131714, 1.1501860618591309]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 7.0, 9.0, 4.0, 4.0, 8.0, 16.0, 11.0, 25.0, 23.0, 24.0, 30.0, 36.0, 34.0, 44.0, 40.0, 42.0, 37.0, 50.0, 54.0, 52.0, 42.0, 34.0, 40.0, 42.0, 31.0, 36.0, 30.0, 28.0, 27.0, 24.0, 24.0, 20.0, 8.0, 12.0, 9.0, 9.0, 9.0, 5.0, 8.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2755107879638672, -0.2669037878513336, -0.25829681754112244, -0.24968981742858887, -0.2410828322172165, -0.23247584700584412, -0.22386884689331055, -0.21526186168193817, -0.2066548764705658, -0.19804789125919342, -0.18944089114665985, -0.18083390593528748, -0.1722269207239151, -0.16361993551254272, -0.15501293540000916, -0.14640595018863678, -0.1377989500761032, -0.12919196486473083, -0.12058497220277786, -0.11197797954082489, -0.10337099432945251, -0.09476400166749954, -0.08615700900554657, -0.0775500237941742, -0.06894303113222122, -0.06033604219555855, -0.051729053258895874, -0.0431220605969429, -0.03451507166028023, -0.025908082723617554, -0.01730109006166458, -0.008694101125001907, -8.71121883392334e-05, 0.008519877679646015, 0.017126867547631264, 0.025733858346939087, 0.03434084728360176, 0.042947836220264435, 0.05155482888221741, 0.06016181781888008, 0.06876880675554276, 0.07737579941749573, 0.0859827846288681, 0.09458977729082108, 0.10319676995277405, 0.11180375516414642, 0.1204107478260994, 0.12901774048805237, 0.13762472569942474, 0.14623171091079712, 0.1548387110233307, 0.16344569623470306, 0.17205268144607544, 0.180659681558609, 0.18926666676998138, 0.19787365198135376, 0.20648065209388733, 0.2150876373052597, 0.22369463741779327, 0.23230162262916565, 0.24090860784053802, 0.2495155930519104, 0.25812259316444397, 0.26672959327697754, 0.2753365635871887]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 14.0, 23.0, 39.0, 59.0, 91.0, 206.0, 359.0, 814.0, 2130.0, 6943.0, 20500.0, 100401.0, 725359.0, 2063584.0, 1066872.0, 166484.0, 27039.0, 7494.0, 3362.0, 1391.0, 504.0, 245.0, 129.0, 83.0, 53.0, 37.0, 20.0, 16.0, 6.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08966064453125, -0.08721256256103516, -0.08476448059082031, -0.08231639862060547, -0.07986831665039062, -0.07742023468017578, -0.07497215270996094, -0.0725240707397461, -0.07007598876953125, -0.0676279067993164, -0.06517982482910156, -0.06273174285888672, -0.060283660888671875, -0.05783557891845703, -0.05538749694824219, -0.052939414978027344, -0.0504913330078125, -0.048043251037597656, -0.04559516906738281, -0.04314708709716797, -0.040699005126953125, -0.03825092315673828, -0.03580284118652344, -0.033354759216308594, -0.03090667724609375, -0.028458595275878906, -0.026010513305664062, -0.02356243133544922, -0.021114349365234375, -0.01866626739501953, -0.016218185424804688, -0.013770103454589844, -0.011322021484375, -0.008873939514160156, -0.0064258575439453125, -0.003977775573730469, -0.001529693603515625, 0.0009183883666992188, 0.0033664703369140625, 0.005814552307128906, 0.00826263427734375, 0.010710716247558594, 0.013158798217773438, 0.015606880187988281, 0.018054962158203125, 0.02050304412841797, 0.022951126098632812, 0.025399208068847656, 0.0278472900390625, 0.030295372009277344, 0.03274345397949219, 0.03519153594970703, 0.037639617919921875, 0.04008769989013672, 0.04253578186035156, 0.044983863830566406, 0.04743194580078125, 0.049880027770996094, 0.05232810974121094, 0.05477619171142578, 0.057224273681640625, 0.05967235565185547, 0.06212043762207031, 0.06456851959228516, 0.0670166015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 7.0, 9.0, 20.0, 35.0, 50.0, 56.0, 69.0, 81.0, 83.0, 102.0, 108.0, 102.0, 94.0, 53.0, 44.0, 37.0, 26.0, 12.0, 10.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09429931640625, -0.09172725677490234, -0.08915519714355469, -0.08658313751220703, -0.08401107788085938, -0.08143901824951172, -0.07886695861816406, -0.0762948989868164, -0.07372283935546875, -0.0711507797241211, -0.06857872009277344, -0.06600666046142578, -0.06343460083007812, -0.06086254119873047, -0.05829048156738281, -0.055718421936035156, -0.0531463623046875, -0.050574302673339844, -0.04800224304199219, -0.04543018341064453, -0.042858123779296875, -0.04028606414794922, -0.03771400451660156, -0.035141944885253906, -0.03256988525390625, -0.029997825622558594, -0.027425765991210938, -0.02485370635986328, -0.022281646728515625, -0.01970958709716797, -0.017137527465820312, -0.014565467834472656, -0.011993408203125, -0.009421348571777344, -0.0068492889404296875, -0.004277229309082031, -0.001705169677734375, 0.0008668899536132812, 0.0034389495849609375, 0.006011009216308594, 0.00858306884765625, 0.011155128479003906, 0.013727188110351562, 0.01629924774169922, 0.018871307373046875, 0.02144336700439453, 0.024015426635742188, 0.026587486267089844, 0.0291595458984375, 0.031731605529785156, 0.03430366516113281, 0.03687572479248047, 0.039447784423828125, 0.04201984405517578, 0.04459190368652344, 0.047163963317871094, 0.04973602294921875, 0.052308082580566406, 0.05488014221191406, 0.05745220184326172, 0.060024261474609375, 0.06259632110595703, 0.06516838073730469, 0.06774044036865234, 0.0703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 1.0, 3.0, 7.0, 16.0, 11.0, 20.0, 18.0, 38.0, 57.0, 96.0, 163.0, 289.0, 629.0, 1457.0, 4296.0, 21030.0, 342477.0, 3619529.0, 182551.0, 15549.0, 3587.0, 1285.0, 526.0, 272.0, 133.0, 85.0, 49.0, 32.0, 19.0, 16.0, 16.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117431640625, -0.11262130737304688, -0.10781097412109375, -0.10300064086914062, -0.0981903076171875, -0.09337997436523438, -0.08856964111328125, -0.08375930786132812, -0.078948974609375, -0.07413864135742188, -0.06932830810546875, -0.06451797485351562, -0.0597076416015625, -0.054897308349609375, -0.05008697509765625, -0.045276641845703125, -0.04046630859375, -0.035655975341796875, -0.03084564208984375, -0.026035308837890625, -0.0212249755859375, -0.016414642333984375, -0.01160430908203125, -0.006793975830078125, -0.001983642578125, 0.002826690673828125, 0.00763702392578125, 0.012447357177734375, 0.0172576904296875, 0.022068023681640625, 0.02687835693359375, 0.031688690185546875, 0.0364990234375, 0.041309356689453125, 0.04611968994140625, 0.050930023193359375, 0.0557403564453125, 0.060550689697265625, 0.06536102294921875, 0.07017135620117188, 0.074981689453125, 0.07979202270507812, 0.08460235595703125, 0.08941268920898438, 0.0942230224609375, 0.09903335571289062, 0.10384368896484375, 0.10865402221679688, 0.11346435546875, 0.11827468872070312, 0.12308502197265625, 0.12789535522460938, 0.1327056884765625, 0.13751602172851562, 0.14232635498046875, 0.14713668823242188, 0.151947021484375, 0.15675735473632812, 0.16156768798828125, 0.16637802124023438, 0.1711883544921875, 0.17599868774414062, 0.18080902099609375, 0.18561935424804688, 0.1904296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 9.0, 16.0, 8.0, 23.0, 50.0, 61.0, 65.0, 80.0, 90.0, 139.0, 189.0, 241.0, 351.0, 332.0, 409.0, 425.0, 363.0, 308.0, 210.0, 168.0, 163.0, 96.0, 56.0, 60.0, 49.0, 25.0, 21.0, 24.0, 15.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09405517578125, -0.09150409698486328, -0.08895301818847656, -0.08640193939208984, -0.08385086059570312, -0.0812997817993164, -0.07874870300292969, -0.07619762420654297, -0.07364654541015625, -0.07109546661376953, -0.06854438781738281, -0.0659933090209961, -0.06344223022460938, -0.060891151428222656, -0.05834007263183594, -0.05578899383544922, -0.0532379150390625, -0.05068683624267578, -0.04813575744628906, -0.045584678649902344, -0.043033599853515625, -0.040482521057128906, -0.03793144226074219, -0.03538036346435547, -0.03282928466796875, -0.03027820587158203, -0.027727127075195312, -0.025176048278808594, -0.022624969482421875, -0.020073890686035156, -0.017522811889648438, -0.014971733093261719, -0.012420654296875, -0.009869575500488281, -0.0073184967041015625, -0.004767417907714844, -0.002216339111328125, 0.00033473968505859375, 0.0028858184814453125, 0.005436897277832031, 0.00798797607421875, 0.010539054870605469, 0.013090133666992188, 0.015641212463378906, 0.018192291259765625, 0.020743370056152344, 0.023294448852539062, 0.02584552764892578, 0.0283966064453125, 0.03094768524169922, 0.03349876403808594, 0.036049842834472656, 0.038600921630859375, 0.041152000427246094, 0.04370307922363281, 0.04625415802001953, 0.04880523681640625, 0.05135631561279297, 0.05390739440917969, 0.056458473205566406, 0.059009552001953125, 0.061560630798339844, 0.06411170959472656, 0.06666278839111328, 0.0692138671875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 16.0, 16.0, 36.0, 43.0, 63.0, 86.0, 117.0, 121.0, 138.0, 116.0, 75.0, 42.0, 23.0, 27.0, 16.0, 13.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0513836145401, -1.0201712846755981, -0.9889589548110962, -0.9577466249465942, -0.9265342950820923, -0.8953219652175903, -0.8641096353530884, -0.8328973054885864, -0.8016849756240845, -0.7704726457595825, -0.7392603158950806, -0.7080479860305786, -0.6768356561660767, -0.6456233263015747, -0.6144109964370728, -0.5831986665725708, -0.5519863367080688, -0.5207740068435669, -0.48956167697906494, -0.458349347114563, -0.42713701725006104, -0.3959246873855591, -0.36471235752105713, -0.3335000276565552, -0.3022876977920532, -0.27107536792755127, -0.23986303806304932, -0.20865070819854736, -0.1774383783340454, -0.14622604846954346, -0.1150137186050415, -0.08380138874053955, -0.05258899927139282, -0.02137666940689087, 0.009835660457611084, 0.04104799032211304, 0.07226032018661499, 0.10347265005111694, 0.1346849799156189, 0.16589730978012085, 0.1971096396446228, 0.22832196950912476, 0.2595342993736267, 0.29074662923812866, 0.3219589591026306, 0.35317128896713257, 0.3843836188316345, 0.4155959486961365, 0.4468082785606384, 0.4780206084251404, 0.5092329382896423, 0.5404452681541443, 0.5716575980186462, 0.6028699278831482, 0.6340822577476501, 0.6652945876121521, 0.696506917476654, 0.727719247341156, 0.758931577205658, 0.7901439070701599, 0.8213562369346619, 0.8525685667991638, 0.8837808966636658, 0.9149932265281677, 0.9462055563926697]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 8.0, 6.0, 1.0, 7.0, 18.0, 13.0, 17.0, 25.0, 23.0, 19.0, 33.0, 43.0, 45.0, 25.0, 55.0, 40.0, 54.0, 49.0, 46.0, 40.0, 49.0, 51.0, 52.0, 35.0, 31.0, 33.0, 29.0, 26.0, 19.0, 19.0, 22.0, 19.0, 12.0, 4.0, 7.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29340970516204834, -0.28261226415634155, -0.27181482315063477, -0.26101741194725037, -0.2502199709415436, -0.2394225299358368, -0.2286251038312912, -0.2178276777267456, -0.20703023672103882, -0.19623279571533203, -0.18543536961078644, -0.17463794350624084, -0.16384050250053406, -0.15304306149482727, -0.14224563539028168, -0.13144820928573608, -0.1206507682800293, -0.1098533347249031, -0.09905590116977692, -0.08825846761465073, -0.07746103405952454, -0.06666360050439835, -0.055866166949272156, -0.045068733394145966, -0.034271299839019775, -0.023473866283893585, -0.012676432728767395, -0.0018789991736412048, 0.008918434381484985, 0.019715867936611176, 0.030513301491737366, 0.041310735046863556, 0.052108168601989746, 0.06290560215711594, 0.07370303571224213, 0.08450046926736832, 0.0952979028224945, 0.1060953363776207, 0.11689276993274689, 0.12769019603729248, 0.13848763704299927, 0.14928507804870605, 0.16008250415325165, 0.17087993025779724, 0.18167737126350403, 0.19247481226921082, 0.2032722383737564, 0.214069664478302, 0.2248671054840088, 0.23566454648971558, 0.24646197259426117, 0.25725939869880676, 0.26805683970451355, 0.27885428071022034, 0.28965169191360474, 0.3004491329193115, 0.3112465739250183, 0.3220440149307251, 0.3328414559364319, 0.3436388671398163, 0.35443630814552307, 0.36523374915122986, 0.37603116035461426, 0.38682860136032104, 0.39762604236602783]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 1.0, 4.0, 9.0, 9.0, 13.0, 23.0, 29.0, 44.0, 46.0, 90.0, 161.0, 249.0, 443.0, 779.0, 1523.0, 3381.0, 8768.0, 29714.0, 182452.0, 656370.0, 127358.0, 23610.0, 7318.0, 2978.0, 1410.0, 714.0, 393.0, 259.0, 156.0, 85.0, 49.0, 42.0, 17.0, 24.0, 9.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0767822265625, -0.07425785064697266, -0.07173347473144531, -0.06920909881591797, -0.06668472290039062, -0.06416034698486328, -0.06163597106933594, -0.059111595153808594, -0.05658721923828125, -0.054062843322753906, -0.05153846740722656, -0.04901409149169922, -0.046489715576171875, -0.04396533966064453, -0.04144096374511719, -0.038916587829589844, -0.0363922119140625, -0.033867835998535156, -0.03134346008300781, -0.02881908416748047, -0.026294708251953125, -0.02377033233642578, -0.021245956420898438, -0.018721580505371094, -0.01619720458984375, -0.013672828674316406, -0.011148452758789062, -0.008624076843261719, -0.006099700927734375, -0.0035753250122070312, -0.0010509490966796875, 0.0014734268188476562, 0.003997802734375, 0.006522178649902344, 0.009046554565429688, 0.011570930480957031, 0.014095306396484375, 0.01661968231201172, 0.019144058227539062, 0.021668434143066406, 0.02419281005859375, 0.026717185974121094, 0.029241561889648438, 0.03176593780517578, 0.034290313720703125, 0.03681468963623047, 0.03933906555175781, 0.041863441467285156, 0.0443878173828125, 0.046912193298339844, 0.04943656921386719, 0.05196094512939453, 0.054485321044921875, 0.05700969696044922, 0.05953407287597656, 0.062058448791503906, 0.06458282470703125, 0.0671072006225586, 0.06963157653808594, 0.07215595245361328, 0.07468032836914062, 0.07720470428466797, 0.07972908020019531, 0.08225345611572266, 0.08477783203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 8.0, 15.0, 21.0, 25.0, 40.0, 52.0, 76.0, 71.0, 88.0, 75.0, 69.0, 87.0, 91.0, 69.0, 56.0, 39.0, 32.0, 27.0, 15.0, 11.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.098876953125, -0.09598731994628906, -0.09309768676757812, -0.09020805358886719, -0.08731842041015625, -0.08442878723144531, -0.08153915405273438, -0.07864952087402344, -0.0757598876953125, -0.07287025451660156, -0.06998062133789062, -0.06709098815917969, -0.06420135498046875, -0.06131172180175781, -0.058422088623046875, -0.05553245544433594, -0.052642822265625, -0.04975318908691406, -0.046863555908203125, -0.04397392272949219, -0.04108428955078125, -0.03819465637207031, -0.035305023193359375, -0.03241539001464844, -0.0295257568359375, -0.026636123657226562, -0.023746490478515625, -0.020856857299804688, -0.01796722412109375, -0.015077590942382812, -0.012187957763671875, -0.009298324584960938, -0.00640869140625, -0.0035190582275390625, -0.000629425048828125, 0.0022602081298828125, 0.00514984130859375, 0.008039474487304688, 0.010929107666015625, 0.013818740844726562, 0.0167083740234375, 0.019598007202148438, 0.022487640380859375, 0.025377273559570312, 0.02826690673828125, 0.031156539916992188, 0.034046173095703125, 0.03693580627441406, 0.039825439453125, 0.04271507263183594, 0.045604705810546875, 0.04849433898925781, 0.05138397216796875, 0.05427360534667969, 0.057163238525390625, 0.06005287170410156, 0.0629425048828125, 0.06583213806152344, 0.06872177124023438, 0.07161140441894531, 0.07450103759765625, 0.07739067077636719, 0.08028030395507812, 0.08316993713378906, 0.0860595703125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 10.0, 10.0, 18.0, 42.0, 55.0, 104.0, 215.0, 364.0, 844.0, 2355.0, 8721.0, 63832.0, 777008.0, 172139.0, 16969.0, 3599.0, 1238.0, 493.0, 205.0, 128.0, 63.0, 56.0, 26.0, 11.0, 14.0, 9.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.10028076171875, -0.09775400161743164, -0.09522724151611328, -0.09270048141479492, -0.09017372131347656, -0.0876469612121582, -0.08512020111083984, -0.08259344100952148, -0.08006668090820312, -0.07753992080688477, -0.0750131607055664, -0.07248640060424805, -0.06995964050292969, -0.06743288040161133, -0.06490612030029297, -0.06237936019897461, -0.05985260009765625, -0.05732583999633789, -0.05479907989501953, -0.05227231979370117, -0.04974555969238281, -0.04721879959106445, -0.044692039489746094, -0.042165279388427734, -0.039638519287109375, -0.037111759185791016, -0.034584999084472656, -0.0320582389831543, -0.029531478881835938, -0.027004718780517578, -0.02447795867919922, -0.02195119857788086, -0.0194244384765625, -0.01689767837524414, -0.014370918273925781, -0.011844158172607422, -0.009317398071289062, -0.006790637969970703, -0.004263877868652344, -0.0017371177673339844, 0.000789642333984375, 0.0033164024353027344, 0.005843162536621094, 0.008369922637939453, 0.010896682739257812, 0.013423442840576172, 0.01595020294189453, 0.01847696304321289, 0.02100372314453125, 0.02353048324584961, 0.02605724334716797, 0.028584003448486328, 0.031110763549804688, 0.03363752365112305, 0.036164283752441406, 0.038691043853759766, 0.041217803955078125, 0.043744564056396484, 0.046271324157714844, 0.0487980842590332, 0.05132484436035156, 0.05385160446166992, 0.05637836456298828, 0.05890512466430664, 0.061431884765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 9.0, 10.0, 9.0, 11.0, 21.0, 13.0, 25.0, 21.0, 29.0, 30.0, 39.0, 33.0, 42.0, 55.0, 70.0, 75.0, 59.0, 46.0, 62.0, 58.0, 43.0, 25.0, 40.0, 38.0, 29.0, 21.0, 17.0, 15.0, 13.0, 13.0, 3.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12200927734375, -0.11821651458740234, -0.11442375183105469, -0.11063098907470703, -0.10683822631835938, -0.10304546356201172, -0.09925270080566406, -0.0954599380493164, -0.09166717529296875, -0.0878744125366211, -0.08408164978027344, -0.08028888702392578, -0.07649612426757812, -0.07270336151123047, -0.06891059875488281, -0.06511783599853516, -0.0613250732421875, -0.057532310485839844, -0.05373954772949219, -0.04994678497314453, -0.046154022216796875, -0.04236125946044922, -0.03856849670410156, -0.034775733947753906, -0.03098297119140625, -0.027190208435058594, -0.023397445678710938, -0.01960468292236328, -0.015811920166015625, -0.012019157409667969, -0.008226394653320312, -0.004433631896972656, -0.000640869140625, 0.0031518936157226562, 0.0069446563720703125, 0.010737419128417969, 0.014530181884765625, 0.01832294464111328, 0.022115707397460938, 0.025908470153808594, 0.02970123291015625, 0.033493995666503906, 0.03728675842285156, 0.04107952117919922, 0.044872283935546875, 0.04866504669189453, 0.05245780944824219, 0.056250572204589844, 0.0600433349609375, 0.06383609771728516, 0.06762886047363281, 0.07142162322998047, 0.07521438598632812, 0.07900714874267578, 0.08279991149902344, 0.0865926742553711, 0.09038543701171875, 0.0941781997680664, 0.09797096252441406, 0.10176372528076172, 0.10555648803710938, 0.10934925079345703, 0.11314201354980469, 0.11693477630615234, 0.1207275390625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 6.0, 4.0, 6.0, 5.0, 18.0, 18.0, 28.0, 64.0, 77.0, 162.0, 374.0, 925.0, 3720.0, 27916.0, 780855.0, 219423.0, 11621.0, 2065.0, 639.0, 260.0, 131.0, 71.0, 36.0, 33.0, 16.0, 16.0, 14.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0218963623046875, -0.02110910415649414, -0.02032184600830078, -0.019534587860107422, -0.018747329711914062, -0.017960071563720703, -0.017172813415527344, -0.016385555267333984, -0.015598297119140625, -0.014811038970947266, -0.014023780822753906, -0.013236522674560547, -0.012449264526367188, -0.011662006378173828, -0.010874748229980469, -0.01008749008178711, -0.00930023193359375, -0.00851297378540039, -0.007725715637207031, -0.006938457489013672, -0.0061511993408203125, -0.005363941192626953, -0.004576683044433594, -0.0037894248962402344, -0.003002166748046875, -0.0022149085998535156, -0.0014276504516601562, -0.0006403923034667969, 0.0001468658447265625, 0.0009341239929199219, 0.0017213821411132812, 0.0025086402893066406, 0.0032958984375, 0.004083156585693359, 0.004870414733886719, 0.005657672882080078, 0.0064449310302734375, 0.007232189178466797, 0.008019447326660156, 0.008806705474853516, 0.009593963623046875, 0.010381221771240234, 0.011168479919433594, 0.011955738067626953, 0.012742996215820312, 0.013530254364013672, 0.014317512512207031, 0.01510477066040039, 0.01589202880859375, 0.01667928695678711, 0.01746654510498047, 0.018253803253173828, 0.019041061401367188, 0.019828319549560547, 0.020615577697753906, 0.021402835845947266, 0.022190093994140625, 0.022977352142333984, 0.023764610290527344, 0.024551868438720703, 0.025339126586914062, 0.026126384735107422, 0.02691364288330078, 0.02770090103149414, 0.0284881591796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 9.0, 18.0, 21.0, 24.0, 26.0, 35.0, 31.0, 35.0, 43.0, 50.0, 94.0, 71.0, 54.0, 56.0, 52.0, 54.0, 48.0, 56.0, 35.0, 36.0, 25.0, 23.0, 13.0, 15.0, 16.0, 17.0, 8.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.377696990966797e-06, -6.195157766342163e-06, -6.012618541717529e-06, -5.8300793170928955e-06, -5.647540092468262e-06, -5.465000867843628e-06, -5.282461643218994e-06, -5.09992241859436e-06, -4.9173831939697266e-06, -4.734843969345093e-06, -4.552304744720459e-06, -4.369765520095825e-06, -4.187226295471191e-06, -4.004687070846558e-06, -3.822147846221924e-06, -3.63960862159729e-06, -3.4570693969726562e-06, -3.2745301723480225e-06, -3.0919909477233887e-06, -2.909451723098755e-06, -2.726912498474121e-06, -2.5443732738494873e-06, -2.3618340492248535e-06, -2.1792948246002197e-06, -1.996755599975586e-06, -1.8142163753509521e-06, -1.6316771507263184e-06, -1.4491379261016846e-06, -1.2665987014770508e-06, -1.084059476852417e-06, -9.015202522277832e-07, -7.189810276031494e-07, -5.364418029785156e-07, -3.5390257835388184e-07, -1.7136335372924805e-07, 1.1175870895385742e-08, 1.9371509552001953e-07, 3.762543201446533e-07, 5.587935447692871e-07, 7.413327693939209e-07, 9.238719940185547e-07, 1.1064112186431885e-06, 1.2889504432678223e-06, 1.471489667892456e-06, 1.6540288925170898e-06, 1.8365681171417236e-06, 2.0191073417663574e-06, 2.201646566390991e-06, 2.384185791015625e-06, 2.566725015640259e-06, 2.7492642402648926e-06, 2.9318034648895264e-06, 3.11434268951416e-06, 3.296881914138794e-06, 3.4794211387634277e-06, 3.6619603633880615e-06, 3.844499588012695e-06, 4.027038812637329e-06, 4.209578037261963e-06, 4.392117261886597e-06, 4.5746564865112305e-06, 4.757195711135864e-06, 4.939734935760498e-06, 5.122274160385132e-06, 5.304813385009766e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 10.0, 4.0, 9.0, 9.0, 16.0, 12.0, 26.0, 46.0, 63.0, 148.0, 299.0, 583.0, 1240.0, 3687.0, 12774.0, 69003.0, 716778.0, 208226.0, 25607.0, 6305.0, 2117.0, 794.0, 355.0, 170.0, 99.0, 53.0, 30.0, 28.0, 14.0, 9.0, 6.0, 15.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.0238037109375, -0.023172855377197266, -0.02254199981689453, -0.021911144256591797, -0.021280288696289062, -0.020649433135986328, -0.020018577575683594, -0.01938772201538086, -0.018756866455078125, -0.01812601089477539, -0.017495155334472656, -0.016864299774169922, -0.016233444213867188, -0.015602588653564453, -0.014971733093261719, -0.014340877532958984, -0.01371002197265625, -0.013079166412353516, -0.012448310852050781, -0.011817455291748047, -0.011186599731445312, -0.010555744171142578, -0.009924888610839844, -0.00929403305053711, -0.008663177490234375, -0.00803232192993164, -0.007401466369628906, -0.006770610809326172, -0.0061397552490234375, -0.005508899688720703, -0.004878044128417969, -0.004247188568115234, -0.0036163330078125, -0.0029854774475097656, -0.0023546218872070312, -0.0017237663269042969, -0.0010929107666015625, -0.0004620552062988281, 0.00016880035400390625, 0.0007996559143066406, 0.001430511474609375, 0.0020613670349121094, 0.0026922225952148438, 0.003323078155517578, 0.0039539337158203125, 0.004584789276123047, 0.005215644836425781, 0.005846500396728516, 0.00647735595703125, 0.007108211517333984, 0.007739067077636719, 0.008369922637939453, 0.009000778198242188, 0.009631633758544922, 0.010262489318847656, 0.01089334487915039, 0.011524200439453125, 0.01215505599975586, 0.012785911560058594, 0.013416767120361328, 0.014047622680664062, 0.014678478240966797, 0.015309333801269531, 0.015940189361572266, 0.016571044921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 9.0, 7.0, 14.0, 24.0, 25.0, 40.0, 55.0, 83.0, 120.0, 142.0, 104.0, 98.0, 66.0, 49.0, 37.0, 33.0, 21.0, 15.0, 12.0, 15.0, 10.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0195770263671875, -0.018964529037475586, -0.018352031707763672, -0.017739534378051758, -0.017127037048339844, -0.01651453971862793, -0.015902042388916016, -0.015289545059204102, -0.014677047729492188, -0.014064550399780273, -0.01345205307006836, -0.012839555740356445, -0.012227058410644531, -0.011614561080932617, -0.011002063751220703, -0.010389566421508789, -0.009777069091796875, -0.009164571762084961, -0.008552074432373047, -0.007939577102661133, -0.007327079772949219, -0.006714582443237305, -0.006102085113525391, -0.0054895877838134766, -0.0048770904541015625, -0.0042645931243896484, -0.0036520957946777344, -0.0030395984649658203, -0.0024271011352539062, -0.0018146038055419922, -0.0012021064758300781, -0.0005896091461181641, 2.288818359375e-05, 0.0006353855133056641, 0.0012478828430175781, 0.0018603801727294922, 0.0024728775024414062, 0.0030853748321533203, 0.0036978721618652344, 0.0043103694915771484, 0.0049228668212890625, 0.0055353641510009766, 0.006147861480712891, 0.006760358810424805, 0.007372856140136719, 0.007985353469848633, 0.008597850799560547, 0.009210348129272461, 0.009822845458984375, 0.010435342788696289, 0.011047840118408203, 0.011660337448120117, 0.012272834777832031, 0.012885332107543945, 0.01349782943725586, 0.014110326766967773, 0.014722824096679688, 0.015335321426391602, 0.015947818756103516, 0.01656031608581543, 0.017172813415527344, 0.017785310745239258, 0.018397808074951172, 0.019010305404663086, 0.019622802734375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 11.0, 19.0, 32.0, 46.0, 97.0, 155.0, 259.0, 160.0, 86.0, 55.0, 31.0, 14.0, 12.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7350334525108337, -0.7178519368171692, -0.7006704807281494, -0.6834889650344849, -0.6663074493408203, -0.6491259336471558, -0.631944477558136, -0.6147629618644714, -0.5975815057754517, -0.5803999900817871, -0.5632185339927673, -0.5460370182991028, -0.5288555026054382, -0.5116740465164185, -0.4944925308227539, -0.47731101512908936, -0.4601294994354248, -0.44294801354408264, -0.4257664978504181, -0.4085850119590759, -0.3914034962654114, -0.3742220103740692, -0.35704052448272705, -0.3398590087890625, -0.32267752289772034, -0.3054960370063782, -0.2883145213127136, -0.27113303542137146, -0.2539515495300293, -0.23677003383636475, -0.21958854794502258, -0.20240704715251923, -0.18522551655769348, -0.16804401576519012, -0.15086251497268677, -0.1336810290813446, -0.11649952828884125, -0.09931802749633789, -0.08213653415441513, -0.06495504081249237, -0.047773540019989014, -0.030592042952775955, -0.013410545885562897, 0.0037709511816501617, 0.02095244824886322, 0.03813394904136658, 0.05531544238328934, 0.0724969357252121, 0.08967843651771545, 0.10685993731021881, 0.12404143065214157, 0.14122292399406433, 0.1584044247865677, 0.17558592557907104, 0.1927674114704132, 0.20994891226291656, 0.22713041305541992, 0.24431191384792328, 0.26149341464042664, 0.2786749005317688, 0.29585641622543335, 0.3130379021167755, 0.3302193880081177, 0.3474009037017822, 0.3645823895931244]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 5.0, 8.0, 8.0, 12.0, 24.0, 16.0, 21.0, 24.0, 28.0, 30.0, 30.0, 22.0, 51.0, 48.0, 55.0, 50.0, 115.0, 59.0, 56.0, 51.0, 43.0, 33.0, 31.0, 36.0, 21.0, 27.0, 18.0, 18.0, 20.0, 9.0, 5.0, 7.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.35718709230422974, -0.3476164937019348, -0.3380458950996399, -0.32847529649734497, -0.31890472769737244, -0.3093341290950775, -0.2997635304927826, -0.29019293189048767, -0.28062233328819275, -0.2710517346858978, -0.2614811360836029, -0.25191056728363037, -0.24233995378017426, -0.23276937007904053, -0.2231987714767456, -0.21362817287445068, -0.20405758917331696, -0.19448699057102203, -0.1849164068698883, -0.17534580826759338, -0.16577520966529846, -0.15620461106300354, -0.1466340273618698, -0.1370634287595749, -0.12749284505844116, -0.11792225390672684, -0.10835165530443192, -0.09878106415271759, -0.08921046555042267, -0.07963987439870834, -0.07006928324699402, -0.0604986846446991, -0.050928086042404175, -0.04135749116539955, -0.03178689628839493, -0.022216305136680603, -0.01264571025967598, -0.003075115382671356, 0.006495475769042969, 0.01606607437133789, 0.025636665523052216, 0.03520726040005684, 0.04477785527706146, 0.05434844642877579, 0.06391903758049011, 0.07348963618278503, 0.08306022733449936, 0.09263082593679428, 0.1022014170885086, 0.11177200824022293, 0.12134260684251785, 0.13091319799423218, 0.1404837965965271, 0.15005439519882202, 0.15962497889995575, 0.16919557750225067, 0.1787661612033844, 0.18833675980567932, 0.19790734350681305, 0.20747794210910797, 0.2170485407114029, 0.22661912441253662, 0.23618972301483154, 0.24576032161712646, 0.2553309202194214]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 12.0, 9.0, 12.0, 22.0, 8.0, 34.0, 29.0, 33.0, 28.0, 36.0, 53.0, 179.0, 266.0, 73.0, 34.0, 33.0, 24.0, 15.0, 16.0, 17.0, 7.0, 8.0, 9.0, 8.0, 4.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06005859375, -0.057923316955566406, -0.05578804016113281, -0.05365276336669922, -0.051517486572265625, -0.04938220977783203, -0.04724693298339844, -0.045111656188964844, -0.04297637939453125, -0.040841102600097656, -0.03870582580566406, -0.03657054901123047, -0.034435272216796875, -0.03229999542236328, -0.030164718627929688, -0.028029441833496094, -0.0258941650390625, -0.023758888244628906, -0.021623611450195312, -0.01948833465576172, -0.017353057861328125, -0.015217781066894531, -0.013082504272460938, -0.010947227478027344, -0.00881195068359375, -0.006676673889160156, -0.0045413970947265625, -0.0024061203002929688, -0.000270843505859375, 0.0018644332885742188, 0.0039997100830078125, 0.006134986877441406, 0.008270263671875, 0.010405540466308594, 0.012540817260742188, 0.014676094055175781, 0.016811370849609375, 0.01894664764404297, 0.021081924438476562, 0.023217201232910156, 0.02535247802734375, 0.027487754821777344, 0.029623031616210938, 0.03175830841064453, 0.033893585205078125, 0.03602886199951172, 0.03816413879394531, 0.040299415588378906, 0.0424346923828125, 0.044569969177246094, 0.04670524597167969, 0.04884052276611328, 0.050975799560546875, 0.05311107635498047, 0.05524635314941406, 0.057381629943847656, 0.05951690673828125, 0.061652183532714844, 0.06378746032714844, 0.06592273712158203, 0.06805801391601562, 0.07019329071044922, 0.07232856750488281, 0.0744638442993164, 0.07659912109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 14.0, 27.0, 37.0, 67.0, 109.0, 196.0, 441.0, 1178.0, 5243.0, 72887.0, 8292191.0, 12555.0, 2318.0, 697.0, 289.0, 132.0, 74.0, 38.0, 26.0, 21.0, 10.0, 8.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2614518105983734, -0.2501899302005768, -0.23892806470394135, -0.22766618430614471, -0.21640431880950928, -0.20514243841171265, -0.19388055801391602, -0.18261867761611938, -0.17135681211948395, -0.16009493172168732, -0.14883306622505188, -0.13757118582725525, -0.12630930542945862, -0.11504743993282318, -0.10378555953502655, -0.09252368658781052, -0.08126181364059448, -0.06999994069337845, -0.058738064020872116, -0.047476187348365784, -0.03621431440114975, -0.024952441453933716, -0.013690561056137085, -0.002428688108921051, 0.008833184838294983, 0.020095059648156166, 0.03135693445801735, 0.04261881113052368, 0.053880684077739716, 0.06514255702495575, 0.07640443742275238, 0.08766631036996841, 0.09892818331718445, 0.11019005626440048, 0.12145192921161652, 0.13271380960941315, 0.14397567510604858, 0.15523755550384521, 0.16649943590164185, 0.17776131629943848, 0.1890231817960739, 0.20028506219387054, 0.21154692769050598, 0.2228088080883026, 0.23407068848609924, 0.24533255398273468, 0.2565944194793701, 0.26785629987716675, 0.2791181802749634, 0.29038006067276, 0.30164194107055664, 0.31290382146835327, 0.3241656720638275, 0.33542755246162415, 0.3466894328594208, 0.3579513132572174, 0.36921316385269165, 0.3804750442504883, 0.3917369246482849, 0.40299880504608154, 0.4142606556415558, 0.4255225360393524, 0.43678441643714905, 0.4480462968349457, 0.4593081772327423]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 9.0, 4.0, 8.0, 2.0, 3.0, 5.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 3.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2817419767379761, -0.2738223373889923, -0.26590266823768616, -0.2579830288887024, -0.25006338953971863, -0.24214373528957367, -0.2342240810394287, -0.22630444169044495, -0.21838480234146118, -0.21046514809131622, -0.20254550874233246, -0.1946258544921875, -0.18670621514320374, -0.17878656089305878, -0.17086690664291382, -0.16294726729393005, -0.1550276130437851, -0.14710795879364014, -0.13918831944465637, -0.1312686651945114, -0.12334902584552765, -0.11542937159538269, -0.10750972479581833, -0.09959007799625397, -0.0916704311966896, -0.08375078439712524, -0.07583113759756088, -0.06791149079799652, -0.05999184027314186, -0.0520721934735775, -0.04415254294872284, -0.03623289614915848, -0.02831326425075531, -0.02039361745119095, -0.012473968788981438, -0.004554320126771927, 0.0033653266727924347, 0.011284973472356796, 0.019204623997211456, 0.027124270796775818, 0.03504391759634018, 0.04296356439590454, 0.0508832111954689, 0.05880286172032356, 0.06672251224517822, 0.07464215159416199, 0.08256180584430695, 0.09048145264387131, 0.09840109944343567, 0.10632074624300003, 0.11424039304256439, 0.12216004729270935, 0.13007968664169312, 0.13799934089183807, 0.14591899514198303, 0.1538386344909668, 0.16175827383995056, 0.16967792809009552, 0.17759756743907928, 0.18551722168922424, 0.193436861038208, 0.20135651528835297, 0.20927616953849792, 0.2171958088874817, 0.22511546313762665]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 7.0, 5.0, 9.0, 10.0, 10.0, 16.0, 25.0, 21.0, 32.0, 32.0, 55.0, 54.0, 59.0, 62.0, 82.0, 74.0, 55.0, 47.0, 55.0, 57.0, 41.0, 51.0, 26.0, 26.0, 18.0, 10.0, 15.0, 13.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.032257080078125, -0.03121471405029297, -0.030172348022460938, -0.029129981994628906, -0.028087615966796875, -0.027045249938964844, -0.026002883911132812, -0.02496051788330078, -0.02391815185546875, -0.02287578582763672, -0.021833419799804688, -0.020791053771972656, -0.019748687744140625, -0.018706321716308594, -0.017663955688476562, -0.01662158966064453, -0.0155792236328125, -0.014536857604980469, -0.013494491577148438, -0.012452125549316406, -0.011409759521484375, -0.010367393493652344, -0.009325027465820312, -0.008282661437988281, -0.00724029541015625, -0.006197929382324219, -0.0051555633544921875, -0.004113197326660156, -0.003070831298828125, -0.0020284652709960938, -0.0009860992431640625, 5.626678466796875e-05, 0.0010986328125, 0.0021409988403320312, 0.0031833648681640625, 0.004225730895996094, 0.005268096923828125, 0.006310462951660156, 0.0073528289794921875, 0.008395195007324219, 0.00943756103515625, 0.010479927062988281, 0.011522293090820312, 0.012564659118652344, 0.013607025146484375, 0.014649391174316406, 0.015691757202148438, 0.01673412322998047, 0.0177764892578125, 0.01881885528564453, 0.019861221313476562, 0.020903587341308594, 0.021945953369140625, 0.022988319396972656, 0.024030685424804688, 0.02507305145263672, 0.02611541748046875, 0.02715778350830078, 0.028200149536132812, 0.029242515563964844, 0.030284881591796875, 0.031327247619628906, 0.03236961364746094, 0.03341197967529297, 0.034454345703125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 3.0, 12.0, 15.0, 34.0, 41.0, 81.0, 107.0, 229.0, 491.0, 1284.0, 3765.0, 14785.0, 110718.0, 341034.0, 40030.0, 7543.0, 2266.0, 859.0, 419.0, 207.0, 112.0, 78.0, 41.0, 34.0, 16.0, 19.0, 9.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.18359375, -1.1431732177734375, -1.102752685546875, -1.0623321533203125, -1.02191162109375, -0.9814910888671875, -0.941070556640625, -0.9006500244140625, -0.8602294921875, -0.8198089599609375, -0.779388427734375, -0.7389678955078125, -0.69854736328125, -0.6581268310546875, -0.617706298828125, -0.5772857666015625, -0.536865234375, -0.4964447021484375, -0.456024169921875, -0.4156036376953125, -0.37518310546875, -0.3347625732421875, -0.294342041015625, -0.2539215087890625, -0.2135009765625, -0.1730804443359375, -0.132659912109375, -0.0922393798828125, -0.05181884765625, -0.0113983154296875, 0.029022216796875, 0.0694427490234375, 0.10986328125, 0.1502838134765625, 0.190704345703125, 0.2311248779296875, 0.27154541015625, 0.3119659423828125, 0.352386474609375, 0.3928070068359375, 0.4332275390625, 0.4736480712890625, 0.514068603515625, 0.5544891357421875, 0.59490966796875, 0.6353302001953125, 0.675750732421875, 0.7161712646484375, 0.756591796875, 0.7970123291015625, 0.837432861328125, 0.8778533935546875, 0.91827392578125, 0.9586944580078125, 0.999114990234375, 1.0395355224609375, 1.0799560546875, 1.1203765869140625, 1.160797119140625, 1.2012176513671875, 1.24163818359375, 1.2820587158203125, 1.322479248046875, 1.3628997802734375, 1.4033203125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 9.0, 12.0, 11.0, 20.0, 27.0, 32.0, 45.0, 31.0, 65.0, 70.0, 88.0, 86.0, 84.0, 88.0, 78.0, 65.0, 56.0, 35.0, 35.0, 23.0, 15.0, 14.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.085693359375, -0.0831766128540039, -0.08065986633300781, -0.07814311981201172, -0.07562637329101562, -0.07310962677001953, -0.07059288024902344, -0.06807613372802734, -0.06555938720703125, -0.06304264068603516, -0.06052589416503906, -0.05800914764404297, -0.055492401123046875, -0.05297565460205078, -0.05045890808105469, -0.047942161560058594, -0.0454254150390625, -0.042908668518066406, -0.04039192199707031, -0.03787517547607422, -0.035358428955078125, -0.03284168243408203, -0.030324935913085938, -0.027808189392089844, -0.02529144287109375, -0.022774696350097656, -0.020257949829101562, -0.01774120330810547, -0.015224456787109375, -0.012707710266113281, -0.010190963745117188, -0.007674217224121094, -0.005157470703125, -0.0026407241821289062, -0.0001239776611328125, 0.0023927688598632812, 0.004909515380859375, 0.007426261901855469, 0.009943008422851562, 0.012459754943847656, 0.01497650146484375, 0.017493247985839844, 0.020009994506835938, 0.02252674102783203, 0.025043487548828125, 0.02756023406982422, 0.030076980590820312, 0.032593727111816406, 0.0351104736328125, 0.037627220153808594, 0.04014396667480469, 0.04266071319580078, 0.045177459716796875, 0.04769420623779297, 0.05021095275878906, 0.052727699279785156, 0.05524444580078125, 0.057761192321777344, 0.06027793884277344, 0.06279468536376953, 0.06531143188476562, 0.06782817840576172, 0.07034492492675781, 0.0728616714477539, 0.07537841796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 8.0, 16.0, 17.0, 15.0, 17.0, 24.0, 22.0, 52.0, 51.0, 42.0, 47.0, 48.0, 23.0, 23.0, 12.0, 11.0, 14.0, 5.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15517164766788483, -0.15032774209976196, -0.1454838365316391, -0.14063993096351624, -0.13579602539539337, -0.1309521198272705, -0.12610821425914764, -0.12126430869102478, -0.11642040312290192, -0.11157649755477905, -0.10673259198665619, -0.10188868641853333, -0.09704478085041046, -0.0922008752822876, -0.08735696971416473, -0.08251306414604187, -0.077669158577919, -0.07282525300979614, -0.06798134744167328, -0.06313744187355042, -0.05829353630542755, -0.05344963073730469, -0.048605725169181824, -0.04376181960105896, -0.038917914032936096, -0.03407400846481323, -0.02923010289669037, -0.024386197328567505, -0.01954229176044464, -0.014698386192321777, -0.009854480624198914, -0.00501057505607605, -0.00016666948795318604, 0.004677236080169678, 0.009521141648292542, 0.014365047216415405, 0.01920895278453827, 0.024052858352661133, 0.028896763920783997, 0.03374066948890686, 0.038584575057029724, 0.04342848062515259, 0.04827238619327545, 0.053116291761398315, 0.05796019732952118, 0.06280410289764404, 0.0676480084657669, 0.07249191403388977, 0.07733581960201263, 0.0821797251701355, 0.08702363073825836, 0.09186753630638123, 0.09671144187450409, 0.10155534744262695, 0.10639925301074982, 0.11124315857887268, 0.11608706414699554, 0.12093096971511841, 0.12577487528324127, 0.13061878085136414, 0.135462686419487, 0.14030659198760986, 0.14515049755573273, 0.1499944031238556, 0.15483830869197845]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 7.0, 4.0, 7.0, 11.0, 8.0, 11.0, 11.0, 12.0, 15.0, 53.0, 87.0, 99.0, 44.0, 14.0, 18.0, 12.0, 11.0, 11.0, 6.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20371556282043457, -0.19731774926185608, -0.19091995060443878, -0.18452215194702148, -0.178124338388443, -0.1717265248298645, -0.1653287261724472, -0.1589309275150299, -0.15253311395645142, -0.14613530039787292, -0.13973750174045563, -0.13333970308303833, -0.12694188952445984, -0.12054408341646194, -0.11414627730846405, -0.10774847120046616, -0.10135066509246826, -0.09495285898447037, -0.08855505287647247, -0.08215724676847458, -0.07575944066047668, -0.06936163455247879, -0.0629638284444809, -0.056566022336483, -0.05016821622848511, -0.04377041012048721, -0.03737260401248932, -0.030974797904491425, -0.02457699179649353, -0.018179185688495636, -0.011781379580497742, -0.005383573472499847, 0.0010142326354980469, 0.007412038743495941, 0.013809844851493835, 0.02020765095949173, 0.026605457067489624, 0.03300326317548752, 0.03940106928348541, 0.04579887539148331, 0.0521966814994812, 0.058594487607479095, 0.06499229371547699, 0.07139009982347488, 0.07778790593147278, 0.08418571203947067, 0.09058351814746857, 0.09698132425546646, 0.10337913036346436, 0.10977693647146225, 0.11617474257946014, 0.12257254868745804, 0.12897035479545593, 0.13536816835403442, 0.14176596701145172, 0.14816376566886902, 0.1545615792274475, 0.160959392786026, 0.1673571914434433, 0.1737549901008606, 0.1801528036594391, 0.18655061721801758, 0.19294841587543488, 0.19934621453285217, 0.20574402809143066]}} \ No newline at end of file